From e37890bc2d7972838c60d848143e7fb61315bb40 Mon Sep 17 00:00:00 2001 From: Willi Raschkowski Date: Mon, 30 Dec 2024 14:56:10 +0100 Subject: [PATCH 1/3] Support 'entries' metadata table --- Cargo.lock | 23 + crates/iceberg/Cargo.toml | 2 + crates/iceberg/src/arrow/schema.rs | 187 +++++ crates/iceberg/src/inspect/entries.rs | 671 ++++++++++++++++++ crates/iceberg/src/inspect/manifests.rs | 74 +- crates/iceberg/src/inspect/metadata_table.rs | 66 +- crates/iceberg/src/inspect/mod.rs | 2 + crates/iceberg/src/inspect/snapshots.rs | 59 +- crates/iceberg/src/scan.rs | 160 ++++- crates/iceberg/src/spec/manifest.rs | 6 + .../testdata/example_table_metadata_v2.json | 10 +- 11 files changed, 1121 insertions(+), 139 deletions(-) create mode 100644 crates/iceberg/src/inspect/entries.rs diff --git a/Cargo.lock b/Cargo.lock index cf4a23df9..18f4ffed5 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -580,6 +580,28 @@ dependencies = [ "wasm-bindgen-futures", ] +[[package]] +name = "async-stream" +version = "0.3.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0b5a71a6f37880a80d1d7f19efd781e4b5de42c88f0722cc13bcb6cc2cfe8476" +dependencies = [ + "async-stream-impl", + "futures-core", + "pin-project-lite", +] + +[[package]] +name = "async-stream-impl" +version = "0.3.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c7c24de15d275a1ecfd47a380fb4d5ec9bfe0933f309ed5e705b775596a3574d" +dependencies = [ + "proc-macro2", + "quote", + "syn 2.0.96", +] + [[package]] name = "async-task" version = "4.7.1" @@ -2947,6 +2969,7 @@ dependencies = [ "arrow-select", "arrow-string", "async-std", + "async-stream", "async-trait", "bimap", "bitvec", diff --git a/crates/iceberg/Cargo.toml b/crates/iceberg/Cargo.toml index 7320c455d..64f6e3d64 100644 --- a/crates/iceberg/Cargo.toml +++ b/crates/iceberg/Cargo.toml @@ -53,6 +53,7 @@ arrow-schema = { workspace = true } arrow-select = { workspace = true } arrow-string = { workspace = true } async-std = { workspace = true, optional = true, features = ["attributes"] } +async-stream = { workspace = true } async-trait = { workspace = true } bimap = { workspace = true } bitvec = { workspace = true } @@ -86,6 +87,7 @@ uuid = { workspace = true } zstd = { workspace = true } [dev-dependencies] +arrow-cast = { workspace = true, features = ["prettyprint"] } ctor = { workspace = true } expect-test = { workspace = true } iceberg-catalog-memory = { workspace = true } diff --git a/crates/iceberg/src/arrow/schema.rs b/crates/iceberg/src/arrow/schema.rs index f4eae018f..4928feb11 100644 --- a/crates/iceberg/src/arrow/schema.rs +++ b/crates/iceberg/src/arrow/schema.rs @@ -827,6 +827,193 @@ get_parquet_stat_as_datum!(min); get_parquet_stat_as_datum!(max); +/// Utilities to deal with [arrow_array::builder] types in the Iceberg context. +pub(crate) mod builder { + use arrow_array::builder::*; + use arrow_array::cast::AsArray; + use arrow_array::types::*; + use arrow_array::{ArrayRef, Datum as ArrowDatum}; + use arrow_schema::{DataType, TimeUnit}; + use ordered_float::OrderedFloat; + + use crate::spec::{Literal, PrimitiveLiteral}; + use crate::{Error, ErrorKind}; + + /// A helper wrapping [ArrayBuilder] for building arrays without declaring the inner type at + /// compile-time when types are determined dynamically (e.g. based on some column type). + /// A [DataType] is given at construction time which is used to later downcast the inner array + /// and provided values. 
+    pub(crate) struct AnyArrayBuilder {
+        data_type: DataType,
+        inner: Box<dyn ArrayBuilder>,
+    }
+
+    impl AnyArrayBuilder {
+        pub(crate) fn new(data_type: &DataType) -> Self {
+            Self {
+                data_type: data_type.clone(),
+                inner: make_builder(data_type, 0),
+            }
+        }
+
+        pub(crate) fn finish(&mut self) -> ArrayRef {
+            self.inner.finish()
+        }
+
+        /// Append an [arrow_array::Datum] value.
+        pub(crate) fn append_datum(&mut self, value: &dyn ArrowDatum) -> crate::Result<()> {
+            let (array, is_scalar) = value.get();
+            assert!(is_scalar, "Can only append scalar datum");
+
+            match array.data_type() {
+                DataType::Boolean => self
+                    .builder::<BooleanBuilder>()?
+                    .append_value(array.as_boolean().value(0)),
+                DataType::Int32 => self
+                    .builder::<Int32Builder>()?
+                    .append_value(array.as_primitive::<Int32Type>().value(0)),
+                DataType::Int64 => self
+                    .builder::<Int64Builder>()?
+                    .append_value(array.as_primitive::<Int64Type>().value(0)),
+                DataType::Float32 => self
+                    .builder::<Float32Builder>()?
+                    .append_value(array.as_primitive::<Float32Type>().value(0)),
+                DataType::Float64 => self
+                    .builder::<Float64Builder>()?
+                    .append_value(array.as_primitive::<Float64Type>().value(0)),
+                DataType::Decimal128(_, _) => self
+                    .builder::<Decimal128Builder>()?
+                    .append_value(array.as_primitive::<Decimal128Type>().value(0)),
+                DataType::Date32 => self
+                    .builder::<Date32Builder>()?
+                    .append_value(array.as_primitive::<Date32Type>().value(0)),
+                DataType::Time64(TimeUnit::Microsecond) => self
+                    .builder::<Time64MicrosecondBuilder>()?
+                    .append_value(array.as_primitive::<Time64MicrosecondType>().value(0)),
+                DataType::Timestamp(TimeUnit::Microsecond, _) => self
+                    .builder::<TimestampMicrosecondBuilder>()?
+                    .append_value(array.as_primitive::<TimestampMicrosecondType>().value(0)),
+                DataType::Timestamp(TimeUnit::Nanosecond, _) => self
+                    .builder::<TimestampNanosecondBuilder>()?
+                    .append_value(array.as_primitive::<TimestampNanosecondType>().value(0)),
+                DataType::Utf8 => self
+                    .builder::<StringBuilder>()?
+                    .append_value(array.as_string::<i32>().value(0)),
+                DataType::FixedSizeBinary(_) => self
+                    .builder::<FixedSizeBinaryBuilder>()?
+                    .append_value(array.as_fixed_size_binary().value(0))?,
+                DataType::LargeBinary => self
+                    .builder::<LargeBinaryBuilder>()?
+                    .append_value(array.as_binary::<i64>().value(0)),
+                _ => {
+                    return Err(Error::new(
+                        ErrorKind::FeatureUnsupported,
+                        format!("Cannot append data type: {:?}", array.data_type(),),
+                    ));
+                }
+            }
+            Ok(())
+        }
+
+        /// Append a literal with the provided [DataType]. We're not solely relying on the literal to
+        /// infer the type because [Literal] values do not specify the expected type of builder. E.g.,
+        /// a [PrimitiveLiteral::Long] may go into an array builder for longs but also for timestamps.
+        pub(crate) fn append_literal(&mut self, value: &Literal) -> crate::Result<()> {
+            let Some(primitive) = value.as_primitive_literal() else {
+                return Err(Error::new(
+                    ErrorKind::FeatureUnsupported,
+                    "Expected primitive type",
+                ));
+            };
+
+            match (&self.data_type, primitive.clone()) {
+                (DataType::Boolean, PrimitiveLiteral::Boolean(value)) => {
+                    self.builder::<BooleanBuilder>()?.append_value(value)
+                }
+                (DataType::Int32, PrimitiveLiteral::Int(value)) => {
+                    self.builder::<Int32Builder>()?.append_value(value)
+                }
+                (DataType::Int64, PrimitiveLiteral::Long(value)) => {
+                    self.builder::<Int64Builder>()?.append_value(value)
+                }
+                (DataType::Float32, PrimitiveLiteral::Float(OrderedFloat(value))) => {
+                    self.builder::<Float32Builder>()?.append_value(value)
+                }
+                (DataType::Float64, PrimitiveLiteral::Double(OrderedFloat(value))) => {
+                    self.builder::<Float64Builder>()?.append_value(value)
+                }
+                (DataType::Utf8, PrimitiveLiteral::String(value)) => {
+                    self.builder::<StringBuilder>()?.append_value(value)
+                }
+                (DataType::FixedSizeBinary(_), PrimitiveLiteral::Binary(value)) => self
+                    .builder::<FixedSizeBinaryBuilder>()?
+                    .append_value(value)?,
+                (DataType::LargeBinary, PrimitiveLiteral::Binary(value)) => {
+                    self.builder::<LargeBinaryBuilder>()?.append_value(value)
+                }
+                (_, _) => {
+                    return Err(Error::new(
+                        ErrorKind::FeatureUnsupported,
+                        format!(
+                            "Builder of type {:?} does not accept literal {:?}",
+                            self.data_type, primitive
+                        ),
+                    ));
+                }
+            }
+
+            Ok(())
+        }
+
+        /// Append a null value for the provided [DataType].
+        pub(crate) fn append_null(&mut self) -> crate::Result<()> {
+            match self.data_type {
+                DataType::Boolean => self.builder::<BooleanBuilder>()?.append_null(),
+                DataType::Int32 => self.builder::<Int32Builder>()?.append_null(),
+                DataType::Int64 => self.builder::<Int64Builder>()?.append_null(),
+                DataType::Float32 => self.builder::<Float32Builder>()?.append_null(),
+                DataType::Float64 => self.builder::<Float64Builder>()?.append_null(),
+                DataType::Decimal128(_, _) => self.builder::<Decimal128Builder>()?.append_null(),
+                DataType::Date32 => self.builder::<Date32Builder>()?.append_null(),
+                DataType::Time64(TimeUnit::Microsecond) => {
+                    self.builder::<Time64MicrosecondBuilder>()?.append_null()
+                }
+                DataType::Timestamp(TimeUnit::Microsecond, _) => {
+                    self.builder::<TimestampMicrosecondBuilder>()?.append_null()
+                }
+                DataType::Timestamp(TimeUnit::Nanosecond, _) => {
+                    self.builder::<TimestampNanosecondBuilder>()?.append_null()
+                }
+                DataType::Utf8 => self.builder::<StringBuilder>()?.append_null(),
+                DataType::FixedSizeBinary(_) => {
+                    self.builder::<FixedSizeBinaryBuilder>()?.append_null()
+                }
+                DataType::LargeBinary => self.builder::<LargeBinaryBuilder>()?.append_null(),
+                _ => {
+                    return Err(Error::new(
+                        ErrorKind::FeatureUnsupported,
+                        format!(
+                            "Cannot append null values for data type: {:?}",
+                            self.data_type
+                        ),
+                    ))
+                }
+            }
+            Ok(())
+        }
+
+        /// Cast the `inner` builder to a specific type or return [Error].
+        fn builder<T: ArrayBuilder>(&mut self) -> crate::Result<&mut T> {
+            self.inner.as_any_mut().downcast_mut::<T>().ok_or_else(|| {
+                Error::new(
+                    ErrorKind::Unexpected,
+                    "Failed to cast builder to expected type",
+                )
+            })
+        }
+    }
+}
+
 impl TryFrom<&ArrowSchema> for crate::spec::Schema {
     type Error = Error;
 
diff --git a/crates/iceberg/src/inspect/entries.rs b/crates/iceberg/src/inspect/entries.rs
new file mode 100644
index 000000000..02d33229e
--- /dev/null
+++ b/crates/iceberg/src/inspect/entries.rs
@@ -0,0 +1,671 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::collections::HashMap;
+use std::sync::Arc;
+
+use arrow_array::builder::{
+    BinaryBuilder, Int32Builder, Int64Builder, Int8Builder, ListBuilder, MapBuilder, StringBuilder,
+};
+use arrow_array::{ArrayRef, RecordBatch, StructArray};
+use arrow_schema::{DataType, Field, FieldRef, Fields, Schema};
+use async_stream::try_stream;
+use futures::StreamExt;
+use itertools::Itertools;
+
+use crate::arrow::builder::AnyArrayBuilder;
+use crate::arrow::{get_arrow_datum, schema_to_arrow_schema, type_to_arrow_type};
+use crate::scan::ArrowRecordBatchStream;
+use crate::spec::{
+    DataFile, ManifestFile, PartitionField, PartitionSpec, SchemaRef, Struct, TableMetadata,
+};
+use crate::table::Table;
+use crate::{Error, ErrorKind, Result};
+
+/// Entries table containing the entries of the current snapshot's manifest files.
+///
+/// The table has one row for each manifest file entry in the current snapshot's manifest list file.
+/// For reference, see the Java implementation of [`ManifestEntry`][1].
+///
+/// [1]: https://github.com/apache/iceberg/blob/apache-iceberg-1.7.1/core/src/main/java/org/apache/iceberg/ManifestEntry.java
+pub struct EntriesTable<'a> {
+    table: &'a Table,
+}
+
+impl<'a> EntriesTable<'a> {
+    /// Create a new Entries table instance.
+    pub fn new(table: &'a Table) -> Self {
+        Self { table }
+    }
+
+    /// Get the schema for the manifest entries table.
+    pub fn schema(&self) -> Schema {
+        Schema::new(vec![
+            Field::new("status", DataType::Int32, false),
+            Field::new("snapshot_id", DataType::Int64, true),
+            Field::new("sequence_number", DataType::Int64, true),
+            Field::new("file_sequence_number", DataType::Int64, true),
+            Field::new(
+                "data_file",
+                DataType::Struct(DataFileStructBuilder::fields(self.table.metadata())),
+                false,
+            ),
+            Field::new(
+                "readable_metrics",
+                DataType::Struct(
+                    ReadableMetricsStructBuilder::fields(self.table.metadata().current_schema())
+                        .expect("Failed to build schema for readable metrics"),
+                ),
+                false,
+            ),
+        ])
+    }
+
+    /// Scan the manifest entries table.
+    pub async fn scan(&self) -> Result<ArrowRecordBatchStream> {
+        let current_snapshot = self.table.metadata().current_snapshot().ok_or_else(|| {
+            Error::new(
+                ErrorKind::Unexpected,
+                "Cannot scan entries for table without current snapshot",
+            )
+        })?;
+
+        let manifest_list = current_snapshot
+            .load_manifest_list(self.table.file_io(), self.table.metadata())
+            .await?;
+
+        // Copy to ensure that the stream can take ownership of these dependencies
+        let arrow_schema = Arc::new(self.schema());
+        let table_metadata = self.table.metadata_ref();
+        let file_io = Arc::new(self.table.file_io().clone());
+
+        Ok(try_stream! {
+            for manifest_file in manifest_list.entries() {
+                let mut status = Int32Builder::new();
+                let mut snapshot_id = Int64Builder::new();
+                let mut sequence_number = Int64Builder::new();
+                let mut file_sequence_number = Int64Builder::new();
+                let mut data_file = DataFileStructBuilder::new(&table_metadata);
+                let mut readable_metrics =
+                    ReadableMetricsStructBuilder::new(table_metadata.current_schema())?;
+
+                for manifest_entry in manifest_file.load_manifest(&file_io).await?.entries() {
+                    status.append_value(manifest_entry.status() as i32);
+                    snapshot_id.append_option(manifest_entry.snapshot_id());
+                    sequence_number.append_option(manifest_entry.sequence_number());
+                    file_sequence_number.append_option(manifest_entry.file_sequence_number());
+                    data_file.append(manifest_file, manifest_entry.data_file())?;
+                    readable_metrics.append(manifest_entry.data_file())?;
+                }
+
+                let batch = RecordBatch::try_new(arrow_schema.clone(), vec![
+                    Arc::new(status.finish()),
+                    Arc::new(snapshot_id.finish()),
+                    Arc::new(sequence_number.finish()),
+                    Arc::new(file_sequence_number.finish()),
+                    Arc::new(data_file.finish()),
+                    Arc::new(readable_metrics.finish()),
+                ])?;
+
+                yield batch;
+            }
+        }
+        .boxed())
+    }
+}
+
+/// Builds the struct describing data files listed in a table manifest.
+///
+/// For reference, see the Java implementation of [`DataFile`][1].
+///
+/// [1]: https://github.com/apache/iceberg/blob/apache-iceberg-1.7.1/api/src/main/java/org/apache/iceberg/DataFile.java
+struct DataFileStructBuilder<'a> {
+    // Reference to table metadata to retrieve partition specs based on partition spec ids
+    table_metadata: &'a TableMetadata,
+    // Below are the field builders of the "data_file" struct
+    content: Int8Builder,
+    file_path: StringBuilder,
+    file_format: StringBuilder,
+    partition: PartitionValuesStructBuilder,
+    record_count: Int64Builder,
+    file_size_in_bytes: Int64Builder,
+    column_sizes: MapBuilder<Int32Builder, Int64Builder>,
+    value_counts: MapBuilder<Int32Builder, Int64Builder>,
+    null_value_counts: MapBuilder<Int32Builder, Int64Builder>,
+    nan_value_counts: MapBuilder<Int32Builder, Int64Builder>,
+    lower_bounds: MapBuilder<Int32Builder, BinaryBuilder>,
+    upper_bounds: MapBuilder<Int32Builder, BinaryBuilder>,
+    key_metadata: BinaryBuilder,
+    split_offsets: ListBuilder<Int64Builder>,
+    equality_ids: ListBuilder<Int32Builder>,
+    sort_order_ids: Int32Builder,
+}
+
+impl<'a> DataFileStructBuilder<'a> {
+    fn new(table_metadata: &'a TableMetadata) -> Self {
+        Self {
+            table_metadata,
+            content: Int8Builder::new(),
+            file_path: StringBuilder::new(),
+            file_format: StringBuilder::new(),
+            partition: PartitionValuesStructBuilder::new(table_metadata),
+            record_count: Int64Builder::new(),
+            file_size_in_bytes: Int64Builder::new(),
+            column_sizes: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
+            value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
+            null_value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
+            nan_value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
+            lower_bounds: MapBuilder::new(None, Int32Builder::new(), BinaryBuilder::new()),
+            upper_bounds: MapBuilder::new(None, Int32Builder::new(), BinaryBuilder::new()),
+            key_metadata: BinaryBuilder::new(),
+            split_offsets: ListBuilder::new(Int64Builder::new()),
+            equality_ids: ListBuilder::new(Int32Builder::new()),
+            sort_order_ids: Int32Builder::new(),
+        }
+    }
+
+    fn fields(table_metadata: &TableMetadata) -> Fields {
+        vec![
+            Field::new("content", DataType::Int8, false),
+            Field::new("file_path", DataType::Utf8, false),
+            Field::new("file_format", DataType::Utf8, false),
+            Field::new(
+                "partition",
+                DataType::Struct(PartitionValuesStructBuilder::combined_partition_fields(
+                    table_metadata,
+                )),
+                false,
+            ),
+            Field::new("record_count", DataType::Int64, false),
+            Field::new("file_size_in_bytes", DataType::Int64, false),
+            Field::new(
+                "column_sizes",
+                Self::column_id_to_value_type(DataType::Int64),
+                true,
+            ),
+            Field::new(
+                "value_counts",
+                Self::column_id_to_value_type(DataType::Int64),
+                true,
+            ),
+            Field::new(
+                "null_value_counts",
+                Self::column_id_to_value_type(DataType::Int64),
+                true,
+            ),
+            Field::new(
+                "nan_value_counts",
+                Self::column_id_to_value_type(DataType::Int64),
+                true,
+            ),
+            Field::new(
+                "lower_bounds",
+                Self::column_id_to_value_type(DataType::Binary),
+                true,
+            ),
+            Field::new(
+                "upper_bounds",
+                Self::column_id_to_value_type(DataType::Binary),
+                true,
+            ),
+            Field::new("key_metadata", DataType::Binary, true),
+            Field::new(
+                "split_offsets",
+                DataType::new_list(DataType::Int64, true),
+                true,
+            ),
+            Field::new(
+                "equality_ids",
+                DataType::new_list(DataType::Int32, true),
+                true,
+            ),
+            Field::new("sort_order_id", DataType::Int32, true),
+        ]
+        .into()
+    }
+
+    /// Construct a new map type that maps from column ids (i32) to the provided value type.
+    /// Keys, the entries struct, and the map itself are non-nullable; values are nullable.
+    fn column_id_to_value_type(value_type: DataType) -> DataType {
+        DataType::Map(
+            Arc::new(Field::new(
+                "entries",
+                DataType::Struct(
+                    vec![
+                        Field::new("keys", DataType::Int32, false),
+                        Field::new("values", value_type, true),
+                    ]
+                    .into(),
+                ),
+                false,
+            )),
+            false,
+        )
+    }
+
+    fn append(&mut self, manifest_file: &ManifestFile, data_file: &DataFile) -> Result<()> {
+        self.content.append_value(data_file.content as i8);
+        self.file_path.append_value(data_file.file_path());
+        self.file_format
+            .append_value(data_file.file_format().to_string().to_uppercase());
+        self.partition.append(
+            self.partition_spec(manifest_file)?.clone().fields(),
+            data_file.partition(),
+        )?;
+        self.record_count
+            .append_value(data_file.record_count() as i64);
+        self.file_size_in_bytes
+            .append_value(data_file.file_size_in_bytes() as i64);
+
+        // Sort keys to get matching order between rows
+        for (k, v) in data_file.column_sizes.iter().sorted_by_key(|(k, _)| *k) {
+            self.column_sizes.keys().append_value(*k);
+            self.column_sizes.values().append_value(*v as i64);
+        }
+        self.column_sizes.append(true)?;
+
+        for (k, v) in data_file.value_counts.iter().sorted_by_key(|(k, _)| *k) {
+            self.value_counts.keys().append_value(*k);
+            self.value_counts.values().append_value(*v as i64);
+        }
+        self.value_counts.append(true)?;
+
+        for (k, v) in data_file
+            .null_value_counts
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+        {
+            self.null_value_counts.keys().append_value(*k);
+            self.null_value_counts.values().append_value(*v as i64);
+        }
+        self.null_value_counts.append(true)?;
+
+        for (k, v) in data_file.nan_value_counts.iter().sorted_by_key(|(k, _)| *k) {
+            self.nan_value_counts.keys().append_value(*k);
+            self.nan_value_counts.values().append_value(*v as i64);
+        }
+        self.nan_value_counts.append(true)?;
+
+        for (k, v) in data_file.lower_bounds.iter().sorted_by_key(|(k, _)| *k) {
+            self.lower_bounds.keys().append_value(*k);
+            self.lower_bounds.values().append_value(v.to_bytes()?);
+        }
+        self.lower_bounds.append(true)?;
+
+        for (k, v) in data_file.upper_bounds.iter().sorted_by_key(|(k, _)| *k) {
+            self.upper_bounds.keys().append_value(*k);
+            self.upper_bounds.values().append_value(v.to_bytes()?);
+        }
+        self.upper_bounds.append(true)?;
+
+        self.key_metadata.append_option(data_file.key_metadata());
+
+        self.split_offsets
+            .values()
+            .append_slice(data_file.split_offsets());
+        self.split_offsets.append(true);
+
+        self.equality_ids
+            .values()
+            .append_slice(data_file.equality_ids());
+        self.equality_ids.append(true);
+
+        self.sort_order_ids.append_option(data_file.sort_order_id());
+        Ok(())
+    }
+
+    fn partition_spec(&self, manifest_file: &ManifestFile) -> Result<&PartitionSpec> {
+        self.table_metadata
+            .partition_spec_by_id(manifest_file.partition_spec_id)
+            .ok_or_else(|| {
+                Error::new(
+                    ErrorKind::Unexpected,
+                    "Partition spec not found for manifest file",
+                )
+            })
+            .map(|spec| spec.as_ref())
+    }
+
+    fn finish(&mut self) -> StructArray {
+        let inner_arrays: Vec<ArrayRef> = vec![
+            Arc::new(self.content.finish()),
+            Arc::new(self.file_path.finish()),
+            Arc::new(self.file_format.finish()),
+            Arc::new(self.partition.finish()),
+            Arc::new(self.record_count.finish()),
+            Arc::new(self.file_size_in_bytes.finish()),
+            Arc::new(self.column_sizes.finish()),
+            Arc::new(self.value_counts.finish()),
+            Arc::new(self.null_value_counts.finish()),
+            Arc::new(self.nan_value_counts.finish()),
+            Arc::new(self.lower_bounds.finish()),
+            Arc::new(self.upper_bounds.finish()),
+            Arc::new(self.key_metadata.finish()),
+            Arc::new(self.split_offsets.finish()),
+            Arc::new(self.equality_ids.finish()),
+            Arc::new(self.sort_order_ids.finish()),
+        ];
+
+        StructArray::from(
+            Self::fields(self.table_metadata)
+                .into_iter()
+                .cloned()
+                .zip_eq(inner_arrays)
+                .collect::<Vec<_>>(),
+        )
+    }
+}
+
+/// Builds a readable metrics struct for a single column.
+///
+/// For reference, see [Java][1] and [Python][2] implementations.
+///
+/// [1]: https://github.com/apache/iceberg/blob/4a432839233f2343a9eae8255532f911f06358ef/core/src/main/java/org/apache/iceberg/MetricsUtil.java#L337
+/// [2]: https://github.com/apache/iceberg-python/blob/a051584a3684392d2db6556449eb299145d47d15/pyiceberg/table/inspect.py#L101-L110
+struct PerColumnReadableMetricsBuilder {
+    field_id: i32,
+    data_type: DataType,
+    column_size: Int64Builder,
+    value_count: Int64Builder,
+    null_value_count: Int64Builder,
+    nan_value_count: Int64Builder,
+    lower_bound: AnyArrayBuilder,
+    upper_bound: AnyArrayBuilder,
+}
+
+impl PerColumnReadableMetricsBuilder {
+    fn fields(data_type: &DataType) -> Fields {
+        vec![
+            Field::new("column_size", DataType::Int64, true),
+            Field::new("value_count", DataType::Int64, true),
+            Field::new("null_value_count", DataType::Int64, true),
+            Field::new("nan_value_count", DataType::Int64, true),
+            Field::new("lower_bound", data_type.clone(), true),
+            Field::new("upper_bound", data_type.clone(), true),
+        ]
+        .into()
+    }
+
+    fn new_for_field(field_id: i32, data_type: &DataType) -> Self {
+        Self {
+            field_id,
+            data_type: data_type.clone(),
+            column_size: Int64Builder::new(),
+            value_count: Int64Builder::new(),
+            null_value_count: Int64Builder::new(),
+            nan_value_count: Int64Builder::new(),
+            lower_bound: AnyArrayBuilder::new(data_type),
+            upper_bound: AnyArrayBuilder::new(data_type),
+        }
+    }
+
+    fn append(&mut self, data_file: &DataFile) -> Result<()> {
+        self.column_size.append_option(
+            data_file
+                .column_sizes()
+                .get(&self.field_id)
+                .map(|&v| v as i64),
+        );
+        self.value_count.append_option(
+            data_file
+                .value_counts()
+                .get(&self.field_id)
+                .map(|&v| v as i64),
+        );
+        self.null_value_count.append_option(
+            data_file
+                .null_value_counts()
+                .get(&self.field_id)
+                .map(|&v| v as i64),
+        );
+        self.nan_value_count.append_option(
+            data_file
+                .nan_value_counts()
+                .get(&self.field_id)
+                .map(|&v| v as i64),
+        );
+        match data_file.lower_bounds().get(&self.field_id) {
+            Some(datum) => self
+                .lower_bound
+                .append_datum(get_arrow_datum(datum)?.as_ref())?,
+            None => self.lower_bound.append_null()?,
+        }
+        match data_file.upper_bounds().get(&self.field_id) {
+            Some(datum) => self
+                .upper_bound
+                .append_datum(get_arrow_datum(datum)?.as_ref())?,
+            None => self.upper_bound.append_null()?,
+        }
+        Ok(())
+    }
+
+    fn finish(&mut self) -> StructArray {
+        let inner_arrays: Vec<ArrayRef> = vec![
+            Arc::new(self.column_size.finish()),
+            Arc::new(self.value_count.finish()),
+            Arc::new(self.null_value_count.finish()),
+            Arc::new(self.nan_value_count.finish()),
+            Arc::new(self.lower_bound.finish()),
+            Arc::new(self.upper_bound.finish()),
+        ];
+
+        StructArray::from(
+            Self::fields(&self.data_type)
+                .into_iter()
+                .cloned()
+                .zip_eq(inner_arrays)
+                .collect::<Vec<_>>(),
+        )
+    }
+}
+
+/// Build a [StructArray] with partition columns as fields and partition values as rows.
+struct PartitionValuesStructBuilder {
+    fields: Fields,
+    builders: Vec<AnyArrayBuilder>,
+}
+
+impl PartitionValuesStructBuilder {
+    /// Construct a new builder from the combined partition columns of the table metadata.
+    fn new(table_metadata: &TableMetadata) -> Self {
+        let combined_fields = Self::combined_partition_fields(table_metadata);
+        Self {
+            builders: combined_fields
+                .iter()
+                .map(|field| AnyArrayBuilder::new(field.data_type()))
+                .collect_vec(),
+            fields: combined_fields,
+        }
+    }
+
+    /// Build the combined partition spec by unioning past and current partition specs
+    fn combined_partition_fields(table_metadata: &TableMetadata) -> Fields {
+        let combined_fields: HashMap<i32, &PartitionField> = table_metadata
+            .partition_specs_iter()
+            .flat_map(|spec| spec.fields())
+            .map(|field| (field.field_id, field))
+            .collect();
+
+        combined_fields
+            .into_iter()
+            // Sort by field id to get a deterministic order
+            .sorted_by_key(|(id, _)| *id)
+            .map(|(_, field)| {
+                let source_type = &table_metadata
+                    .current_schema()
+                    .field_by_id(field.source_id)
+                    .unwrap()
+                    .field_type;
+                let result_type = field.transform.result_type(source_type).unwrap();
+                Field::new(
+                    field.name.clone(),
+                    type_to_arrow_type(&result_type).unwrap(),
+                    true,
+                )
+            })
+            .collect()
+    }
+
+    fn append(
+        &mut self,
+        partition_fields: &[PartitionField],
+        partition_values: &Struct,
+    ) -> Result<()> {
+        for (field, value) in partition_fields.iter().zip_eq(partition_values.iter()) {
+            let index = self.find_field(&field.name)?;
+
+            match value {
+                Some(literal) => self.builders[index].append_literal(literal)?,
+                None => self.builders[index].append_null()?,
+            }
+        }
+        Ok(())
+    }
+
+    fn finish(&mut self) -> StructArray {
+        let arrays: Vec<ArrayRef> = self
+            .builders
+            .iter_mut()
+            .map::<ArrayRef, _>(|builder| Arc::new(builder.finish()))
+            .collect();
+        StructArray::from(
+            self.fields
+                .iter()
+                .cloned()
+                .zip_eq(arrays)
+                .collect::<Vec<_>>(),
+        )
+    }
+
+    fn find_field(&self, name: &str) -> Result<usize> {
+        match self.fields.find(name) {
+            Some((index, _)) => Ok(index),
+            None => Err(Error::new(
+                ErrorKind::Unexpected,
+                format!("Field not found: {}", name),
+            )),
+        }
+    }
+}
+
+struct ReadableMetricsStructBuilder<'a> {
+    table_schema: &'a SchemaRef,
+    column_builders: Vec<PerColumnReadableMetricsBuilder>,
+}
+
+impl<'a> ReadableMetricsStructBuilder<'a> {
+    /// Helper to construct the per-column readable metrics fields. The metrics are "readable" in
+    /// that lower and upper bounds are reported as deserialized values rather than raw bytes.
+    fn fields(table_schema: &SchemaRef) -> Result<Fields> {
+        let arrow_schema = schema_to_arrow_schema(table_schema)?;
+
+        Ok(arrow_schema
+            .fields()
+            .iter()
+            .map(|field| {
+                Field::new(
+                    field.name(),
+                    DataType::Struct(PerColumnReadableMetricsBuilder::fields(field.data_type())),
+                    false,
+                )
+            })
+            .collect_vec()
+            .into())
+    }
+
+    fn new(table_schema: &'a SchemaRef) -> Result<Self> {
+        Ok(Self {
+            table_schema,
+            column_builders: table_schema
+                .as_struct()
+                .fields()
+                .iter()
+                .map(|field| {
+                    type_to_arrow_type(&field.field_type).map(|arrow_type| {
+                        PerColumnReadableMetricsBuilder::new_for_field(field.id, &arrow_type)
+                    })
+                })
+                .collect::<Result<Vec<_>>>()?,
+        })
+    }
+
+    fn append(&mut self, data_file: &DataFile) -> Result<()> {
+        for column_builder in &mut self.column_builders {
+            column_builder.append(data_file)?;
+        }
+        Ok(())
+    }
+
+    fn finish(&mut self) -> StructArray {
+        let fields: Vec<FieldRef> = Self::fields(self.table_schema)
+            // We already checked the schema conversion in the constructor
+            .unwrap()
+            .into_iter()
+            .cloned()
+            .collect();
+        let arrays: Vec<ArrayRef> = self
+            .column_builders
+            .iter_mut()
+            .map::<ArrayRef, _>(|builder| Arc::new(builder.finish()))
+            .collect();
+        StructArray::from(
+            fields
+                .into_iter()
+                .zip_eq(arrays)
+                .collect::<Vec<(FieldRef, ArrayRef)>>(),
+        )
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use expect_test::expect;
+
+    use crate::inspect::metadata_table::tests::check_record_batches;
+    use crate::scan::tests::TableTestFixture;
+
+    #[tokio::test]
+    async fn test_entries_table() {
+        let mut fixture = TableTestFixture::new();
+        fixture.setup_manifest_files().await;
+        let table = fixture.table;
+
+        let batch_stream = table.inspect().entries().scan().await.unwrap();
+
+        check_record_batches(
+            batch_stream,
+            expect![[r#"
+                Field { name: "status", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} },
+                Field { name: "snapshot_id", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
+                Field { name: "sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
+                Field { name: "file_sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
+                Field { name: "data_file", data_type: Struct([Field { name: "content", data_type: Int8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_path", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_format", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "partition", data_type: Struct([Field { name: "x", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "record_count", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_size_in_bytes", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "column_sizes", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_counts", data_type: Map(Field {
name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_counts", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_counts", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bounds", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bounds", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "key_metadata", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "split_offsets", data_type: List(Field { name: "item", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "equality_ids", data_type: List(Field { name: "item", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "sort_order_id", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, + Field { name: "readable_metrics", data_type: Struct([Field { name: "x", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { 
name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "y", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "z", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "a", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "dbl", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "i32", 
data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "i64", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "bool", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "float", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "decimal", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: 
Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "date", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamp", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamptz", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestampns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, 
dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamptzns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "binary", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }"#]], + expect![[r#" + 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+ + | status | snapshot_id | sequence_number | file_sequence_number | data_file | readable_metrics | + 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+ + | 1 | 3055729675574597004 | 1 | 1 | {content: 0, file_format: PARQUET, partition: {x: 100}, record_count: 1, file_size_in_bytes: 100, column_sizes: {1: 1, 2: 1}, value_counts: {1: 2, 2: 2}, null_value_counts: {1: 3, 2: 3}, nan_value_counts: {1: 4, 2: 4}, lower_bounds: {1: 0100000000000000, 2: 0200000000000000, 3: 0300000000000000, 4: 417061636865, 5: 0000000000005940, 6: 64000000, 7: 6400000000000000, 8: 00, 9: 0000c842, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, upper_bounds: {1: 0100000000000000, 2: 0500000000000000, 3: 0400000000000000, 4: 49636562657267, 5: 0000000000006940, 6: c8000000, 7: c800000000000000, 8: 01, 9: 00004843, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: 1, value_count: 2, 
null_value_count: 3, nan_value_count: 4, lower_bound: 1, upper_bound: 1}, y: {column_size: 1, value_count: 2, null_value_count: 3, nan_value_count: 4, lower_bound: 2, upper_bound: 5}, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 3, upper_bound: 4}, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: Apache, upper_bound: Iceberg}, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: false, upper_bound: true}, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01, upper_bound: 1970-01-01}, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00, upper_bound: 1970-01-01T00:00:00}, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00Z, upper_bound: 1970-01-01T00:00:00Z}, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | + | 2 | 3055729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 200}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , 
lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | + | 0 | 3051729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 300}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | + 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+"#]], + &[], + &["file_path"], + None, + ).await; + } +} diff --git a/crates/iceberg/src/inspect/manifests.rs b/crates/iceberg/src/inspect/manifests.rs index e94e48a45..8f5da7f8f 100644 --- a/crates/iceberg/src/inspect/manifests.rs +++ b/crates/iceberg/src/inspect/manifests.rs @@ -285,75 +285,13 @@ mod tests { Field { name: "deleted_delete_files_count", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "17"} }, Field { name: "partition_summaries", data_type: List(Field { name: "item", data_type: Struct([Field { name: "contains_null", data_type: Boolean, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "10"} }, Field { name: "contains_nan", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: 
{"PARQUET:field_id": "11"} }, Field { name: "lower_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "12"} }, Field { name: "upper_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "13"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "9"} }), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "8"} }"#]], expect![[r#" - content: PrimitiveArray - [ - 0, - ], - path: (skipped), - length: (skipped), - partition_spec_id: PrimitiveArray - [ - 0, - ], - added_snapshot_id: PrimitiveArray - [ - 3055729675574597004, - ], - added_data_files_count: PrimitiveArray - [ - 1, - ], - existing_data_files_count: PrimitiveArray - [ - 1, - ], - deleted_data_files_count: PrimitiveArray - [ - 1, - ], - added_delete_files_count: PrimitiveArray - [ - 1, - ], - existing_delete_files_count: PrimitiveArray - [ - 1, - ], - deleted_delete_files_count: PrimitiveArray - [ - 1, - ], - partition_summaries: ListArray - [ - StructArray - -- validity: - [ - valid, - ] - [ - -- child 0: "contains_null" (Boolean) - BooleanArray - [ - false, - ] - -- child 1: "contains_nan" (Boolean) - BooleanArray - [ - false, - ] - -- child 2: "lower_bound" (Utf8) - StringArray - [ - "100", - ] - -- child 3: "upper_bound" (Utf8) - StringArray - [ - "300", - ] - ], - ]"#]], + +---------+-------------------+---------------------+------------------------+---------------------------+--------------------------+--------------------------+-----------------------------+----------------------------+-----------------------------------------------------------------------------------+ + | content | partition_spec_id | added_snapshot_id | added_data_files_count | existing_data_files_count | deleted_data_files_count | added_delete_files_count | existing_delete_files_count | deleted_delete_files_count | partition_summaries | + +---------+-------------------+---------------------+------------------------+---------------------------+--------------------------+--------------------------+-----------------------------+----------------------------+-----------------------------------------------------------------------------------+ + | 0 | 0 | 3055729675574597004 | 1 | 1 | 1 | 1 | 1 | 1 | [{contains_null: false, contains_nan: false, lower_bound: 100, upper_bound: 300}] | + +---------+-------------------+---------------------+------------------------+---------------------------+--------------------------+--------------------------+-----------------------------+----------------------------+-----------------------------------------------------------------------------------+"#]], &["path", "length"], + &[], Some("path"), ).await; } diff --git a/crates/iceberg/src/inspect/metadata_table.rs b/crates/iceberg/src/inspect/metadata_table.rs index 75dbc7472..3ea029cf3 100644 --- a/crates/iceberg/src/inspect/metadata_table.rs +++ b/crates/iceberg/src/inspect/metadata_table.rs @@ -16,6 +16,7 @@ // under the License. use super::{ManifestsTable, SnapshotsTable}; +use crate::inspect::entries::EntriesTable; use crate::table::Table; /// Metadata table is used to inspect a table's history, snapshots, and other metadata as a table. @@ -33,6 +34,11 @@ impl<'a> MetadataTable<'a> { Self(table) } + /// Returns the current manifest file's entries. + pub fn entries(&self) -> EntriesTable { + EntriesTable::new(self.0) + } + /// Get the snapshots table. 
pub fn snapshots(&self) -> SnapshotsTable { SnapshotsTable::new(self.0) @@ -46,6 +52,11 @@ impl<'a> MetadataTable<'a> { #[cfg(test)] pub mod tests { + use std::sync::Arc; + + use arrow_array::{ArrayRef, RecordBatch, StructArray}; + use arrow_cast::pretty::pretty_format_batches; + use arrow_schema::{DataType, Field, FieldRef, Schema}; use expect_test::Expect; use futures::TryStreamExt; use itertools::Itertools; @@ -59,12 +70,14 @@ pub mod tests { /// or use rust-analyzer (see [video](https://github.com/rust-analyzer/expect-test)). /// Check the doc of [`expect_test`] for more details. /// - `ignore_check_columns`: Some columns are not stable, so we can skip them. + /// - `ignore_check_struct_fields`: Same as `ignore_check_columns` but for (top-level) struct fields. /// - `sort_column`: The order of the data might be non-deterministic, so we can sort it by a column. pub async fn check_record_batches( batch_stream: ArrowRecordBatchStream, expected_schema: Expect, expected_data: Expect, ignore_check_columns: &[&str], + ignore_check_struct_fields: &[&str], sort_column: Option<&str>, ) { let record_batches = batch_stream.try_collect::>().await.unwrap(); @@ -85,25 +98,46 @@ pub mod tests { .collect_vec(); } + // Filter columns + let (fields, columns): (Vec<_>, Vec<_>) = record_batch + .schema() + .fields + .iter() + .zip_eq(columns) + // Filter ignored columns + .filter(|(field, _)| !ignore_check_columns.contains(&field.name().as_str())) + // For struct fields, filter ignored struct fields + .map(|(field, column)| match field.data_type() { + DataType::Struct(fields) => { + let struct_array = column.as_any().downcast_ref::().unwrap(); + let filtered: Vec<(FieldRef, ArrayRef)> = fields + .iter() + .zip_eq(struct_array.columns().iter()) + .filter(|(f, _)| !ignore_check_struct_fields.contains(&f.name().as_str())) + .map(|(f, c)| (f.clone(), c.clone())) + .collect_vec(); + let filtered_struct_type: DataType = DataType::Struct( + filtered.iter().map(|(f, _)| f.clone()).collect_vec().into(), + ); + ( + Field::new(field.name(), filtered_struct_type, field.is_nullable()).into(), + Arc::new(StructArray::from(filtered)) as ArrayRef, + ) + } + _ => (field.clone(), column), + }) + .unzip(); + expected_schema.assert_eq(&format!( "{}", record_batch.schema().fields().iter().format(",\n") )); - expected_data.assert_eq(&format!( - "{}", - record_batch - .schema() - .fields() - .iter() - .zip_eq(columns) - .map(|(field, column)| { - if ignore_check_columns.contains(&field.name().as_str()) { - format!("{}: (skipped)", field.name()) - } else { - format!("{}: {:?}", field.name(), column) - } - }) - .format(",\n") - )); + expected_data.assert_eq( + &pretty_format_batches(&[ + RecordBatch::try_new(Arc::new(Schema::new(fields)), columns).unwrap() + ]) + .unwrap() + .to_string(), + ); } } diff --git a/crates/iceberg/src/inspect/mod.rs b/crates/iceberg/src/inspect/mod.rs index b64420ea1..02a57e664 100644 --- a/crates/iceberg/src/inspect/mod.rs +++ b/crates/iceberg/src/inspect/mod.rs @@ -17,10 +17,12 @@ //! Metadata table APIs. 
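+//!
+//! As an illustrative sketch (assuming an existing [`crate::table::Table`] value
+//! named `table`; not a doc-test), entries of the current snapshot can be scanned
+//! and collected into Arrow record batches:
+//!
+//! ```ignore
+//! use futures::TryStreamExt;
+//!
+//! let batches: Vec<arrow_array::RecordBatch> = table
+//!     .inspect()
+//!     .entries()
+//!     .scan()
+//!     .await?
+//!     .try_collect()
+//!     .await?;
+//! ```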
+mod entries; mod manifests; mod metadata_table; mod snapshots; +pub use entries::EntriesTable; pub use manifests::ManifestsTable; pub use metadata_table::*; pub use snapshots::SnapshotsTable; diff --git a/crates/iceberg/src/inspect/snapshots.rs b/crates/iceberg/src/inspect/snapshots.rs index 1ee89963d..f5703b043 100644 --- a/crates/iceberg/src/inspect/snapshots.rs +++ b/crates/iceberg/src/inspect/snapshots.rs @@ -130,59 +130,14 @@ mod tests { Field { name: "manifest_list", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "summary", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }"#]], expect![[r#" - committed_at: PrimitiveArray - [ - 2018-01-04T21:22:35.770+00:00, - 2019-04-12T20:29:15.770+00:00, - ], - snapshot_id: PrimitiveArray - [ - 3051729675574597004, - 3055729675574597004, - ], - parent_id: PrimitiveArray - [ - null, - 3051729675574597004, - ], - operation: StringArray - [ - "append", - "append", - ], - manifest_list: (skipped), - summary: MapArray - [ - StructArray - -- validity: - [ - ] - [ - -- child 0: "keys" (Utf8) - StringArray - [ - ] - -- child 1: "values" (Utf8) - StringArray - [ - ] - ], - StructArray - -- validity: - [ - ] - [ - -- child 0: "keys" (Utf8) - StringArray - [ - ] - -- child 1: "values" (Utf8) - StringArray - [ - ] - ], - ]"#]], + +--------------------------+---------------------+---------------------+-----------+---------+ + | committed_at | snapshot_id | parent_id | operation | summary | + +--------------------------+---------------------+---------------------+-----------+---------+ + | 2018-01-04T21:22:35.770Z | 3051729675574597004 | | append | {} | + | 2019-04-12T20:29:15.770Z | 3055729675574597004 | 3051729675574597004 | append | {} | + +--------------------------+---------------------+---------------------+-----------+---------+"#]], &["manifest_list"], + &[], Some("committed_at"), ).await; } diff --git a/crates/iceberg/src/scan.rs b/crates/iceberg/src/scan.rs index bfa1266dd..cfcf45af9 100644 --- a/crates/iceberg/src/scan.rs +++ b/crates/iceberg/src/scan.rs @@ -1123,8 +1123,11 @@ pub mod tests { use std::sync::Arc; use arrow_array::{ - ArrayRef, BooleanArray, Float64Array, Int32Array, Int64Array, RecordBatch, StringArray, + ArrayRef, BooleanArray, Date32Array, Decimal128Array, Float32Array, Float64Array, + Int32Array, Int64Array, LargeBinaryArray, RecordBatch, StringArray, + TimestampMicrosecondArray, TimestampNanosecondArray, }; + use arrow_schema::{DataType, TimeUnit}; use futures::{stream, TryStreamExt}; use parquet::arrow::{ArrowWriter, PARQUET_FIELD_ID_META_KEY}; use parquet::basic::Compression; @@ -1284,6 +1287,50 @@ pub mod tests { .record_count(1) .partition(Struct::from_iter([Some(Literal::long(100))])) .key_metadata(None) + // Note: + // The bounds below need to agree with the test data written below + // into the Parquet file. If not, tests that rely on filter scans + // fail because of wrong bounds. 
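+            // As an illustration (not exhaustive): field 2 ("y") is declared below
+            // with lower bound 2 and upper bound 5, so a filter scan with a
+            // predicate like `y > 5` may prune this data file from these bounds
+            // alone, without reading the Parquet file.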
+ .lower_bounds(HashMap::from([ + (1, Datum::long(1)), + (2, Datum::long(2)), + (3, Datum::long(3)), + (4, Datum::string("Apache")), + (5, Datum::double(100)), + (6, Datum::int(100)), + (7, Datum::long(100)), + (8, Datum::bool(false)), + (9, Datum::float(100.0)), + // decimal values are not supported by schema::get_arrow_datum + // (10, Datum::decimal(Decimal(123, 2))), + (11, Datum::date(0)), + (12, Datum::timestamp_micros(0)), + (13, Datum::timestamptz_micros(0)), + // ns timestamps, uuid, fixed, binary are currently not + // supported in schema::get_arrow_datum + ])) + .upper_bounds(HashMap::from([ + (1, Datum::long(1)), + (2, Datum::long(5)), + (3, Datum::long(4)), + (4, Datum::string("Iceberg")), + (5, Datum::double(200)), + (6, Datum::int(200)), + (7, Datum::long(200)), + (8, Datum::bool(true)), + (9, Datum::float(200.0)), + // decimal values are not supported by schema::get_arrow_datum + // (10, Datum::decimal(Decimal(123, 2))), + (11, Datum::date(0)), + (12, Datum::timestamp_micros(0)), + (13, Datum::timestamptz_micros(0)), + // ns timestamps, uuid, fixed, binary are currently not + // supported in schema::get_arrow_datum + ])) + .column_sizes(HashMap::from([(1, 1u64), (2, 1u64)])) + .value_counts(HashMap::from([(1, 2u64), (2, 2u64)])) + .null_value_counts(HashMap::from([(1, 3u64), (2, 3u64)])) + .nan_value_counts(HashMap::from([(1, 4u64), (2, 4u64)])) .build() .unwrap(), ) @@ -1392,6 +1439,69 @@ pub mod tests { PARQUET_FIELD_ID_META_KEY.to_string(), "8".to_string(), )])), + arrow_schema::Field::new("float", arrow_schema::DataType::Float32, false) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "9".to_string(), + )])), + arrow_schema::Field::new( + "decimal", + arrow_schema::DataType::Decimal128(3, 2), + false, + ) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "10".to_string(), + )])), + arrow_schema::Field::new("date", arrow_schema::DataType::Date32, false) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "11".to_string(), + )])), + arrow_schema::Field::new( + "timestamp", + arrow_schema::DataType::Timestamp(TimeUnit::Microsecond, None), + false, + ) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "12".to_string(), + )])), + arrow_schema::Field::new( + "timestamptz", + arrow_schema::DataType::Timestamp( + TimeUnit::Microsecond, + Some("UTC".into()), + ), + false, + ) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "13".to_string(), + )])), + arrow_schema::Field::new( + "timestampns", + arrow_schema::DataType::Timestamp(TimeUnit::Nanosecond, None), + false, + ) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "14".to_string(), + )])), + arrow_schema::Field::new( + "timestamptzns", + arrow_schema::DataType::Timestamp(TimeUnit::Nanosecond, Some("UTC".into())), + false, + ) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "15".to_string(), + )])), + arrow_schema::Field::new("binary", arrow_schema::DataType::LargeBinary, false) + .with_metadata(HashMap::from([( + PARQUET_FIELD_ID_META_KEY.to_string(), + "16".to_string(), + )])), ]; Arc::new(arrow_schema::Schema::new(fields)) }; @@ -1441,8 +1551,54 @@ pub mod tests { let values: BooleanArray = values.into(); let col8 = Arc::new(values) as ArrayRef; + // float: + let mut values = vec![100.0f32; 512]; + values.append(vec![150.0f32; 12].as_mut()); + values.append(vec![200.0f32; 500].as_mut()); + let col9 = 
Arc::new(Float32Array::from_iter_values(values)) as ArrayRef;
+
+        // decimal:
+        let values = vec![123i128; 1024];
+        let col10 = Arc::new(
+            Decimal128Array::from_iter_values(values)
+                .with_data_type(DataType::Decimal128(3, 2)),
+        );
+
+        // date:
+        let values = vec![0i32; 1024];
+        let col11 = Arc::new(Date32Array::from_iter_values(values));
+
+        // timestamp:
+        let values = vec![0i64; 1024];
+        let col12 = Arc::new(TimestampMicrosecondArray::from_iter_values(values));
+
+        // timestamptz:
+        let values = vec![0i64; 1024];
+        let col13 = Arc::new(
+            TimestampMicrosecondArray::from_iter_values(values).with_data_type(
+                DataType::Timestamp(TimeUnit::Microsecond, Some("UTC".into())),
+            ),
+        );
+
+        // timestampns:
+        let values = vec![0i64; 1024];
+        let col14 = Arc::new(TimestampNanosecondArray::from_iter_values(values));
+
+        // timestamptzns:
+        let values = vec![0i64; 1024];
+        let col15 = Arc::new(
+            TimestampNanosecondArray::from_iter_values(values).with_data_type(
+                DataType::Timestamp(TimeUnit::Nanosecond, Some("UTC".into())),
+            ),
+        );
+
+        // binary:
+        let values = vec![[0u8; 8]; 1024];
+        let col16 = Arc::new(LargeBinaryArray::from_iter_values(values));
+
         let to_write = RecordBatch::try_new(schema.clone(), vec![
-            col1, col2, col3, col4, col5, col6, col7, col8,
+            col1, col2, col3, col4, col5, col6, col7, col8, col9, col10, col11, col12, col13,
+            col14, col15, col16,
         ])
         .unwrap();
diff --git a/crates/iceberg/src/spec/manifest.rs b/crates/iceberg/src/spec/manifest.rs
index c82f353fe..b47591e88 100644
--- a/crates/iceberg/src/spec/manifest.rs
+++ b/crates/iceberg/src/spec/manifest.rs
@@ -1196,6 +1196,12 @@ impl ManifestEntry {
         self.sequence_number
     }
 
+    /// File sequence number.
+    #[inline]
+    pub fn file_sequence_number(&self) -> Option<i64> {
+        self.file_sequence_number
+    }
+
     /// File size in bytes.
#[inline] pub fn file_size_in_bytes(&self) -> u64 { diff --git a/crates/iceberg/testdata/example_table_metadata_v2.json b/crates/iceberg/testdata/example_table_metadata_v2.json index 17bbd7d99..8ac937751 100644 --- a/crates/iceberg/testdata/example_table_metadata_v2.json +++ b/crates/iceberg/testdata/example_table_metadata_v2.json @@ -25,7 +25,15 @@ {"id": 5, "name": "dbl", "required": true, "type": "double"}, {"id": 6, "name": "i32", "required": true, "type": "int"}, {"id": 7, "name": "i64", "required": true, "type": "long"}, - {"id": 8, "name": "bool", "required": true, "type": "boolean"} + {"id": 8, "name": "bool", "required": true, "type": "boolean"}, + {"id": 9, "name": "float", "required": true, "type": "float"}, + {"id": 10, "name": "decimal", "required": true, "type": "decimal(3,2)"}, + {"id": 11, "name": "date", "required": true, "type": "date"}, + {"id": 12, "name": "timestamp", "required": true, "type": "timestamp"}, + {"id": 13, "name": "timestamptz", "required": true, "type": "timestamptz"}, + {"id": 14, "name": "timestampns", "required": true, "type": "timestamp_ns"}, + {"id": 15, "name": "timestamptzns", "required": true, "type": "timestamptz_ns"}, + {"id": 16, "name": "binary", "required": true, "type": "binary"} ] } ], From 2d470062e5b060890d8bdcfbbd3425cf6e0d61ac Mon Sep 17 00:00:00 2001 From: Willi Raschkowski Date: Sat, 8 Feb 2025 12:51:42 +0000 Subject: [PATCH 2/3] Iceberg schema --- Cargo.lock | 2 +- crates/iceberg/src/arrow/schema.rs | 187 ---- crates/iceberg/src/inspect/entries.rs | 894 +++++++++---------- crates/iceberg/src/inspect/metadata_table.rs | 10 +- crates/iceberg/src/inspect/metrics.rs | 428 +++++++++ crates/iceberg/src/inspect/mod.rs | 1 + crates/iceberg/src/spec/manifest.rs | 30 +- crates/iceberg/src/spec/partition.rs | 307 ++++++- 8 files changed, 1168 insertions(+), 691 deletions(-) create mode 100644 crates/iceberg/src/inspect/metrics.rs diff --git a/Cargo.lock b/Cargo.lock index 18f4ffed5..c5dc68865 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -599,7 +599,7 @@ checksum = "c7c24de15d275a1ecfd47a380fb4d5ec9bfe0933f309ed5e705b775596a3574d" dependencies = [ "proc-macro2", "quote", - "syn 2.0.96", + "syn 2.0.98", ] [[package]] diff --git a/crates/iceberg/src/arrow/schema.rs b/crates/iceberg/src/arrow/schema.rs index 4928feb11..f4eae018f 100644 --- a/crates/iceberg/src/arrow/schema.rs +++ b/crates/iceberg/src/arrow/schema.rs @@ -827,193 +827,6 @@ get_parquet_stat_as_datum!(min); get_parquet_stat_as_datum!(max); -/// Utilities to deal with [arrow_array::builder] types in the Iceberg context. -pub(crate) mod builder { - use arrow_array::builder::*; - use arrow_array::cast::AsArray; - use arrow_array::types::*; - use arrow_array::{ArrayRef, Datum as ArrowDatum}; - use arrow_schema::{DataType, TimeUnit}; - use ordered_float::OrderedFloat; - - use crate::spec::{Literal, PrimitiveLiteral}; - use crate::{Error, ErrorKind}; - - /// A helper wrapping [ArrayBuilder] for building arrays without declaring the inner type at - /// compile-time when types are determined dynamically (e.g. based on some column type). - /// A [DataType] is given at construction time which is used to later downcast the inner array - /// and provided values. 
- pub(crate) struct AnyArrayBuilder { - data_type: DataType, - inner: Box, - } - - impl AnyArrayBuilder { - pub(crate) fn new(data_type: &DataType) -> Self { - Self { - data_type: data_type.clone(), - inner: make_builder(data_type, 0), - } - } - - pub(crate) fn finish(&mut self) -> ArrayRef { - self.inner.finish() - } - - /// Append an [[arrow_array::Datum]] value. - pub(crate) fn append_datum(&mut self, value: &dyn ArrowDatum) -> crate::Result<()> { - let (array, is_scalar) = value.get(); - assert!(is_scalar, "Can only append scalar datum"); - - match array.data_type() { - DataType::Boolean => self - .builder::()? - .append_value(array.as_boolean().value(0)), - DataType::Int32 => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Int64 => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Float32 => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Float64 => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Decimal128(_, _) => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Date32 => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Time64(TimeUnit::Microsecond) => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Timestamp(TimeUnit::Microsecond, _) => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Timestamp(TimeUnit::Nanosecond, _) => self - .builder::()? - .append_value(array.as_primitive::().value(0)), - DataType::Utf8 => self - .builder::()? - .append_value(array.as_string::().value(0)), - DataType::FixedSizeBinary(_) => self - .builder::()? - .append_value(array.as_fixed_size_binary().value(0)), - DataType::LargeBinary => self - .builder::()? - .append_value(array.as_binary::().value(0)), - _ => { - return Err(Error::new( - ErrorKind::FeatureUnsupported, - format!("Cannot append data type: {:?}", array.data_type(),), - )); - } - } - Ok(()) - } - - /// Append a literal with the provided [DataType]. We're not solely relying on the literal to - /// infer the type because [Literal] values do not specify the expected type of builder. E.g., - /// a [PrimitiveLiteral::Long] may go into an array builder for longs but also for timestamps. - pub(crate) fn append_literal(&mut self, value: &Literal) -> crate::Result<()> { - let Some(primitive) = value.as_primitive_literal() else { - return Err(Error::new( - ErrorKind::FeatureUnsupported, - "Expected primitive type", - )); - }; - - match (&self.data_type, primitive.clone()) { - (DataType::Boolean, PrimitiveLiteral::Boolean(value)) => { - self.builder::()?.append_value(value) - } - (DataType::Int32, PrimitiveLiteral::Int(value)) => { - self.builder::()?.append_value(value) - } - (DataType::Int64, PrimitiveLiteral::Long(value)) => { - self.builder::()?.append_value(value) - } - (DataType::Float32, PrimitiveLiteral::Float(OrderedFloat(value))) => { - self.builder::()?.append_value(value) - } - (DataType::Float64, PrimitiveLiteral::Double(OrderedFloat(value))) => { - self.builder::()?.append_value(value) - } - (DataType::Utf8, PrimitiveLiteral::String(value)) => { - self.builder::()?.append_value(value) - } - (DataType::FixedSizeBinary(_), PrimitiveLiteral::Binary(value)) => self - .builder::()? 
- .append_value(value)?, - (DataType::LargeBinary, PrimitiveLiteral::Binary(value)) => { - self.builder::()?.append_value(value) - } - (_, _) => { - return Err(Error::new( - ErrorKind::FeatureUnsupported, - format!( - "Builder of type {:?} does not accept literal {:?}", - self.data_type, primitive - ), - )); - } - } - - Ok(()) - } - - /// Append a null value for the provided [DataType]. - pub(crate) fn append_null(&mut self) -> crate::Result<()> { - match self.data_type { - DataType::Boolean => self.builder::()?.append_null(), - DataType::Int32 => self.builder::()?.append_null(), - DataType::Int64 => self.builder::()?.append_null(), - DataType::Float32 => self.builder::()?.append_null(), - DataType::Float64 => self.builder::()?.append_null(), - DataType::Decimal128(_, _) => self.builder::()?.append_null(), - DataType::Date32 => self.builder::()?.append_null(), - DataType::Time64(TimeUnit::Microsecond) => { - self.builder::()?.append_null() - } - DataType::Timestamp(TimeUnit::Microsecond, _) => { - self.builder::()?.append_null() - } - DataType::Timestamp(TimeUnit::Nanosecond, _) => { - self.builder::()?.append_null() - } - DataType::Utf8 => self.builder::()?.append_null(), - DataType::FixedSizeBinary(_) => { - self.builder::()?.append_null() - } - DataType::LargeBinary => self.builder::()?.append_null(), - _ => { - return Err(Error::new( - ErrorKind::FeatureUnsupported, - format!( - "Cannot append null values for data type: {:?}", - self.data_type - ), - )) - } - } - Ok(()) - } - - /// Cast the `inner` builder to a specific type or return [Error]. - fn builder(&mut self) -> crate::Result<&mut T> { - self.inner.as_any_mut().downcast_mut::().ok_or_else(|| { - Error::new( - ErrorKind::Unexpected, - "Failed to cast builder to expected type", - ) - }) - } - } -} - impl TryFrom<&ArrowSchema> for crate::spec::Schema { type Error = Error; diff --git a/crates/iceberg/src/inspect/entries.rs b/crates/iceberg/src/inspect/entries.rs index 02d33229e..c25452356 100644 --- a/crates/iceberg/src/inspect/entries.rs +++ b/crates/iceberg/src/inspect/entries.rs @@ -15,23 +15,30 @@ // specific language governing permissions and limitations // under the License. 
-use std::collections::HashMap; +use std::any::type_name; +use std::string::ToString; use std::sync::Arc; use arrow_array::builder::{ - BinaryBuilder, Int32Builder, Int64Builder, Int8Builder, ListBuilder, MapBuilder, StringBuilder, + ArrayBuilder, BooleanBuilder, Date32Builder, Decimal128Builder, FixedSizeBinaryBuilder, + Float32Builder, Float64Builder, Int32Builder, Int64Builder, LargeBinaryBuilder, ListBuilder, + MapBuilder, PrimitiveBuilder, StringBuilder, StructBuilder, TimestampMicrosecondBuilder, + TimestampNanosecondBuilder, }; -use arrow_array::{ArrayRef, RecordBatch, StructArray}; -use arrow_schema::{DataType, Field, FieldRef, Fields, Schema}; +use arrow_array::types::{Int32Type, Int64Type}; +use arrow_array::{ArrowPrimitiveType, RecordBatch, StructArray}; +use arrow_schema::{DataType, Fields, TimeUnit}; use async_stream::try_stream; use futures::StreamExt; use itertools::Itertools; +use ordered_float::OrderedFloat; -use crate::arrow::builder::AnyArrayBuilder; -use crate::arrow::{get_arrow_datum, schema_to_arrow_schema, type_to_arrow_type}; +use crate::arrow::{schema_to_arrow_schema, type_to_arrow_type}; +use crate::inspect::metrics::ReadableMetricsStructBuilder; use crate::scan::ArrowRecordBatchStream; use crate::spec::{ - DataFile, ManifestFile, PartitionField, PartitionSpec, SchemaRef, Struct, TableMetadata, + DataFile, Datum, ManifestFile, NestedFieldRef, PrimitiveLiteral, Schema, Struct, TableMetadata, + Type, }; use crate::table::Table; use crate::{Error, ErrorKind, Result}; @@ -52,29 +59,6 @@ impl<'a> EntriesTable<'a> { Self { table } } - /// Get the schema for the manifest entries table. - pub fn schema(&self) -> Schema { - Schema::new(vec![ - Field::new("status", DataType::Int32, false), - Field::new("snapshot_id", DataType::Int64, true), - Field::new("sequence_number", DataType::Int64, true), - Field::new("file_sequence_number", DataType::Int64, true), - Field::new( - "data_file", - DataType::Struct(DataFileStructBuilder::fields(self.table.metadata())), - false, - ), - Field::new( - "readable_metrics", - DataType::Struct( - ReadableMetricsStructBuilder::fields(self.table.metadata().current_schema()) - .expect("Failed to build schema for readable metrics"), - ), - false, - ), - ]) - } - /// Scan the manifest entries table. pub async fn scan(&self) -> Result { let current_snapshot = self.table.metadata().current_snapshot().ok_or_else(|| { @@ -89,9 +73,14 @@ impl<'a> EntriesTable<'a> { .await?; // Copy to ensure that the stream can take ownership of these dependencies - let arrow_schema = Arc::new(self.schema()); + let schema = self.schema(); + let arrow_schema = Arc::new(schema_to_arrow_schema(&schema)?); let table_metadata = self.table.metadata_ref(); let file_io = Arc::new(self.table.file_io().clone()); + let readable_metrics_schema = schema + .field_by_name("readable_metrics") + .and_then(|field| field.field_type.clone().to_struct_type()) + .unwrap(); Ok(try_stream! 
{ for manifest_file in manifest_list.entries() { @@ -99,9 +88,10 @@ impl<'a> EntriesTable<'a> { let mut snapshot_id = Int64Builder::new(); let mut sequence_number = Int64Builder::new(); let mut file_sequence_number = Int64Builder::new(); - let mut data_file = DataFileStructBuilder::new(&table_metadata); + let mut data_file = DataFileStructBuilder::new(&table_metadata)?; let mut readable_metrics = - ReadableMetricsStructBuilder::new(table_metadata.current_schema())?; + ReadableMetricsStructBuilder::new( + table_metadata.current_schema(), &readable_metrics_schema)?; for manifest_entry in manifest_file.load_manifest(&file_io).await?.entries() { status.append_value(manifest_entry.status() as i32); @@ -126,6 +116,22 @@ impl<'a> EntriesTable<'a> { } .boxed()) } + + /// Get the schema for the manifest entries table. + pub fn schema(&self) -> Schema { + let partition_type = crate::spec::partition_type(self.table.metadata()).unwrap(); + let schema = Schema::builder() + .with_fields(crate::spec::_const_schema::manifest_schema_fields_v2( + &partition_type, + )) + .build() + .unwrap(); + let readable_metric_schema = ReadableMetricsStructBuilder::readable_metrics_schema( + self.table.metadata().current_schema(), + &schema, + ); + join_schemas(&schema, &readable_metric_schema.unwrap()).unwrap() + } } /// Builds the struct describing data files listed in a table manifest. @@ -134,500 +140,423 @@ impl<'a> EntriesTable<'a> { /// /// [1]: https://github.com/apache/iceberg/blob/apache-iceberg-1.7.1/api/src/main/java/org/apache/iceberg/DataFile.java struct DataFileStructBuilder<'a> { - // Reference to table metadata to retrieve partition specs based on partition spec ids + /// Builder for data file struct (including the partition struct). + struct_builder: StructBuilder, + /// Arrow fields of the combined partition struct of all partition specs. + /// We require this to reconstruct the field builders in the partition [`StructBuilder`]. + combined_partition_fields: Fields, + /// Table metadata to look up partition specs by partition spec id. table_metadata: &'a TableMetadata, - // Below are the field builders of the "data_file" struct - content: Int8Builder, - file_path: StringBuilder, - file_format: StringBuilder, - partition: PartitionValuesStructBuilder, - record_count: Int64Builder, - file_size_in_bytes: Int64Builder, - column_sizes: MapBuilder, - value_counts: MapBuilder, - null_value_counts: MapBuilder, - nan_value_counts: MapBuilder, - lower_bounds: MapBuilder, - upper_bounds: MapBuilder, - key_metadata: BinaryBuilder, - split_offsets: ListBuilder, - equality_ids: ListBuilder, - sort_order_ids: Int32Builder, } impl<'a> DataFileStructBuilder<'a> { - fn new(table_metadata: &'a TableMetadata) -> Self { - Self { + fn new(table_metadata: &'a TableMetadata) -> Result { + let combined_partition_type = crate::spec::partition_type(table_metadata)?; + let data_file_fields = + crate::spec::_const_schema::data_file_fields_v2(&combined_partition_type); + let data_file_schema = Schema::builder().with_fields(data_file_fields).build()?; + let DataType::Struct(combined_partition_fields) = + type_to_arrow_type(&Type::Struct(combined_partition_type))? 
+        else {
+            panic!("Converted Arrow type was not struct")
+        };
+
+        Ok(DataFileStructBuilder {
+            struct_builder: StructBuilder::from_fields(
+                schema_to_arrow_schema(&data_file_schema)?.fields,
+                0,
+            ),
+            combined_partition_fields,
             table_metadata,
-            content: Int8Builder::new(),
-            file_path: StringBuilder::new(),
-            file_format: StringBuilder::new(),
-            partition: PartitionValuesStructBuilder::new(table_metadata),
-            record_count: Int64Builder::new(),
-            file_size_in_bytes: Int64Builder::new(),
-            column_sizes: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
-            value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
-            null_value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
-            nan_value_counts: MapBuilder::new(None, Int32Builder::new(), Int64Builder::new()),
-            lower_bounds: MapBuilder::new(None, Int32Builder::new(), BinaryBuilder::new()),
-            upper_bounds: MapBuilder::new(None, Int32Builder::new(), BinaryBuilder::new()),
-            key_metadata: BinaryBuilder::new(),
-            split_offsets: ListBuilder::new(Int64Builder::new()),
-            equality_ids: ListBuilder::new(Int32Builder::new()),
-            sort_order_ids: Int32Builder::new(),
-        }
+        })
     }

-    fn fields(table_metadata: &TableMetadata) -> Fields {
-        vec![
-            Field::new("content", DataType::Int8, false),
-            Field::new("file_path", DataType::Utf8, false),
-            Field::new("file_format", DataType::Utf8, false),
-            Field::new(
-                "partition",
-                DataType::Struct(PartitionValuesStructBuilder::combined_partition_fields(
-                    table_metadata,
-                )),
-                false,
-            ),
-            Field::new("record_count", DataType::Int64, false),
-            Field::new("file_size_in_bytes", DataType::Int64, false),
-            Field::new(
-                "column_sizes",
-                Self::column_id_to_value_type(DataType::Int64),
-                true,
-            ),
-            Field::new(
-                "value_counts",
-                Self::column_id_to_value_type(DataType::Int64),
-                true,
-            ),
-            Field::new(
-                "null_value_counts",
-                Self::column_id_to_value_type(DataType::Int64),
-                true,
-            ),
-            Field::new(
-                "nan_value_counts",
-                Self::column_id_to_value_type(DataType::Int64),
-                true,
-            ),
-            Field::new(
-                "lower_bounds",
-                Self::column_id_to_value_type(DataType::Binary),
-                true,
-            ),
-            Field::new(
-                "upper_bounds",
-                Self::column_id_to_value_type(DataType::Binary),
-                true,
-            ),
-            Field::new("key_metadata", DataType::Binary, true),
-            Field::new(
-                "split_offsets",
-                DataType::new_list(DataType::Int64, true),
-                true,
-            ),
-            Field::new(
-                "equality_ids",
-                DataType::new_list(DataType::Int32, true),
-                true,
-            ),
-            Field::new("sort_order_id", DataType::Int32, true),
-        ]
-        .into()
-    }
+    fn append(&mut self, manifest_file: &ManifestFile, data_file: &DataFile) -> Result<()> {
+        // Content type
+        self.field_builder::<Int32Builder>(0)?
+            .append_value(data_file.content as i32);

-    /// Construct a new struct type that maps from column ids (i32) to the provided value type.
-    /// Keys, values, and the whole struct are non-nullable.
-    fn column_id_to_value_type(value_type: DataType) -> DataType {
-        DataType::Map(
-            Arc::new(Field::new(
-                "entries",
-                DataType::Struct(
-                    vec![
-                        Field::new("keys", DataType::Int32, false),
-                        Field::new("values", value_type, true),
-                    ]
-                    .into(),
-                ),
-                false,
-            )),
-            false,
-        )
-    }
+        // File path
+        self.field_builder::<StringBuilder>(1)?
+            .append_value(data_file.file_path());

-    fn append(&mut self, manifest_file: &ManifestFile, data_file: &DataFile) -> Result<()> {
-        self.content.append_value(data_file.content as i8);
-        self.file_path.append_value(data_file.file_path());
-        self.file_format
+        // File format
+        self.field_builder::<StringBuilder>(2)?
             .append_value(data_file.file_format().to_string().to_uppercase());
-        self.partition.append(
-            self.partition_spec(manifest_file)?.clone().fields(),
-            data_file.partition(),
-        )?;
-        self.record_count
-            .append_value(data_file.record_count() as i64);
-        self.file_size_in_bytes
-            .append_value(data_file.file_size_in_bytes() as i64);
-        // Sort keys to get matching order between rows
-        for (k, v) in data_file.column_sizes.iter().sorted_by_key(|(k, _)| *k) {
-            self.column_sizes.keys().append_value(*k);
-            self.column_sizes.values().append_value(*v as i64);
-        }
-        self.column_sizes.append(true)?;
+        // Partitions
+        self.append_partition_values(manifest_file.partition_spec_id, data_file.partition())?;

-        for (k, v) in data_file.value_counts.iter().sorted_by_key(|(k, _)| *k) {
-            self.value_counts.keys().append_value(*k);
-            self.value_counts.values().append_value(*v as i64);
-        }
-        self.value_counts.append(true)?;
+        // Record count
+        self.field_builder::<Int64Builder>(4)?
+            .append_value(data_file.record_count() as i64);
+
+        // File size in bytes
+        self.field_builder::<Int64Builder>(5)?
+            .append_value(data_file.file_size_in_bytes() as i64);

-        for (k, v) in data_file
-            .null_value_counts
+        // Column sizes
+        let (column_size_keys, column_size_values): (Vec<i32>, Vec<i64>) = data_file
+            .column_sizes()
             .iter()
             .sorted_by_key(|(k, _)| *k)
-        {
-            self.null_value_counts.keys().append_value(*k);
-            self.null_value_counts.values().append_value(*v as i64);
-        }
-        self.null_value_counts.append(true)?;
-
-        for (k, v) in data_file.nan_value_counts.iter().sorted_by_key(|(k, _)| *k) {
-            self.nan_value_counts.keys().append_value(*k);
-            self.nan_value_counts.values().append_value(*v as i64);
-        }
-        self.nan_value_counts.append(true)?;
+            .map(|(k, v)| (*k, *v as i64))
+            .unzip();
+        self.append_to_map_field::<Int32Builder, Int64Builder>(
+            6,
+            |key_builder| key_builder.append_slice(column_size_keys.as_slice()),
+            |value_builder| value_builder.append_slice(column_size_values.as_slice()),
+        )?;

-        for (k, v) in data_file.lower_bounds.iter().sorted_by_key(|(k, _)| *k) {
-            self.lower_bounds.keys().append_value(*k);
-            self.lower_bounds.values().append_value(v.to_bytes()?);
-        }
-        self.lower_bounds.append(true)?;
+        // Value counts
+        let (value_count_keys, value_count_values): (Vec<i32>, Vec<i64>) = data_file
+            .value_counts()
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+            .map(|(k, v)| (*k, *v as i64))
+            .unzip();
+        self.append_to_primitive_map_field::<Int32Type, Int64Type>(
+            7,
+            value_count_keys.as_slice(),
+            value_count_values.as_slice(),
+        )?;

-        for (k, v) in data_file.upper_bounds.iter().sorted_by_key(|(k, _)| *k) {
-            self.upper_bounds.keys().append_value(*k);
-            self.upper_bounds.values().append_value(v.to_bytes()?);
-        }
-        self.upper_bounds.append(true)?;
+        // Null value counts
+        let (null_count_keys, null_count_values): (Vec<i32>, Vec<i64>) = data_file
+            .null_value_counts()
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+            .map(|(k, v)| (*k, *v as i64))
+            .unzip();
+        self.append_to_primitive_map_field::<Int32Type, Int64Type>(
+            8,
+            null_count_keys.as_slice(),
+            null_count_values.as_slice(),
+        )?;

-        self.key_metadata.append_option(data_file.key_metadata());
+        // NaN value counts
+        let (nan_count_keys, nan_count_values): (Vec<i32>, Vec<i64>) = data_file
+            .nan_value_counts()
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+            .map(|(k, v)| (*k, *v as i64))
+            .unzip();
+        self.append_to_primitive_map_field::<Int32Type, Int64Type>(
+            9,
+            nan_count_keys.as_slice(),
+            nan_count_values.as_slice(),
+        )?;

-        self.split_offsets
-            .values()
-            .append_slice(data_file.split_offsets());
-        self.split_offsets.append(true);
+        // Lower bounds
+        let (lower_bound_keys, lower_bound_values): (Vec<i32>, Vec<Datum>) = data_file
+            .lower_bounds()
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+            .map(|(k, v)| (*k, v.clone()))
+            .unzip();
+        self.append_to_map_field::<Int32Builder, LargeBinaryBuilder>(
+            10,
+            |key_builder| key_builder.append_slice(lower_bound_keys.as_slice()),
+            |value_builder| {
+                for v in &lower_bound_values {
+                    value_builder.append_value(v.to_bytes().unwrap())
+                }
+            },
+        )?;

-        self.equality_ids
-            .values()
-            .append_slice(data_file.equality_ids());
-        self.equality_ids.append(true);
+        // Upper bounds
+        let (upper_bound_keys, upper_bound_values): (Vec<i32>, Vec<Datum>) = data_file
+            .upper_bounds()
+            .iter()
+            .sorted_by_key(|(k, _)| *k)
+            .map(|(k, v)| (*k, v.clone()))
+            .unzip();
+        self.append_to_map_field::<Int32Builder, LargeBinaryBuilder>(
+            11,
+            |key_builder| key_builder.append_slice(upper_bound_keys.as_slice()),
+            |value_builder| {
+                for v in &upper_bound_values {
+                    value_builder.append_value(v.to_bytes().unwrap())
+                }
+            },
+        )?;

-        self.sort_order_ids.append_option(data_file.sort_order_id());
-        Ok(())
-    }
+        // Key metadata
+        self.field_builder::<LargeBinaryBuilder>(12)?
+            .append_option(data_file.key_metadata());

-    fn partition_spec(&self, manifest_file: &ManifestFile) -> Result<&PartitionSpec> {
-        self.table_metadata
-            .partition_spec_by_id(manifest_file.partition_spec_id)
-            .ok_or_else(|| {
-                Error::new(
-                    ErrorKind::Unexpected,
-                    "Partition spec not found for manifest file",
-                )
-            })
-            .map(|spec| spec.as_ref())
-    }
+        // Split offsets
+        self.append_to_list_field::<Int64Type>(13, data_file.split_offsets())?;

-    fn finish(&mut self) -> StructArray {
-        let inner_arrays: Vec<ArrayRef> = vec![
-            Arc::new(self.content.finish()),
-            Arc::new(self.file_path.finish()),
-            Arc::new(self.file_format.finish()),
-            Arc::new(self.partition.finish()),
-            Arc::new(self.record_count.finish()),
-            Arc::new(self.file_size_in_bytes.finish()),
-            Arc::new(self.column_sizes.finish()),
-            Arc::new(self.value_counts.finish()),
-            Arc::new(self.null_value_counts.finish()),
-            Arc::new(self.nan_value_counts.finish()),
-            Arc::new(self.lower_bounds.finish()),
-            Arc::new(self.upper_bounds.finish()),
-            Arc::new(self.key_metadata.finish()),
-            Arc::new(self.split_offsets.finish()),
-            Arc::new(self.equality_ids.finish()),
-            Arc::new(self.sort_order_ids.finish()),
-        ];
-
-        StructArray::from(
-            Self::fields(self.table_metadata)
-                .into_iter()
-                .cloned()
-                .zip_eq(inner_arrays)
-                .collect::<Vec<_>>(),
-        )
-    }
-}
+        // Equality ids
+        self.append_to_list_field::<Int32Type>(14, data_file.equality_ids())?;

-/// Builds a readable metrics struct for a single column.
-///
-/// For reference, see [Java][1] and [Python][2] implementations.
-///
-/// [1]: https://github.com/apache/iceberg/blob/4a432839233f2343a9eae8255532f911f06358ef/core/src/main/java/org/apache/iceberg/MetricsUtil.java#L337
-/// [2]: https://github.com/apache/iceberg-python/blob/a051584a3684392d2db6556449eb299145d47d15/pyiceberg/table/inspect.py#L101-L110
-struct PerColumnReadableMetricsBuilder {
-    field_id: i32,
-    data_type: DataType,
-    column_size: Int64Builder,
-    value_count: Int64Builder,
-    null_value_count: Int64Builder,
-    nan_value_count: Int64Builder,
-    lower_bound: AnyArrayBuilder,
-    upper_bound: AnyArrayBuilder,
-}
+        // Sort order ids
+        self.field_builder::<Int32Builder>(15)?
+            .append_option(data_file.sort_order_id());

-impl PerColumnReadableMetricsBuilder {
-    fn fields(data_type: &DataType) -> Fields {
-        vec![
-            Field::new("column_size", DataType::Int64, true),
-            Field::new("value_count", DataType::Int64, true),
-            Field::new("null_value_count", DataType::Int64, true),
-            Field::new("nan_value_count", DataType::Int64, true),
-            Field::new("lower_bound", data_type.clone(), true),
-            Field::new("upper_bound", data_type.clone(), true),
-        ]
-        .into()
+        // Append an element in the struct
+        self.struct_builder.append(true);
+        Ok(())
     }

-    fn new_for_field(field_id: i32, data_type: &DataType) -> Self {
-        Self {
-            field_id,
-            data_type: data_type.clone(),
-            column_size: Int64Builder::new(),
-            value_count: Int64Builder::new(),
-            null_value_count: Int64Builder::new(),
-            nan_value_count: Int64Builder::new(),
-            lower_bound: AnyArrayBuilder::new(data_type),
-            upper_bound: AnyArrayBuilder::new(data_type),
-        }
+    fn field_builder<T: ArrayBuilder>(&mut self, index: usize) -> Result<&mut T> {
+        self.struct_builder.field_builder_or_err::<T>(index)
     }

-    fn append(&mut self, data_file: &DataFile) -> Result<()> {
-        self.column_size.append_option(
-            data_file
-                .column_sizes()
-                .get(&self.field_id)
-                .map(|&v| v as i64),
-        );
-        self.value_count.append_option(
-            data_file
-                .value_counts()
-                .get(&self.field_id)
-                .map(|&v| v as i64),
-        );
-        self.null_value_count.append_option(
-            data_file
-                .null_value_counts()
-                .get(&self.field_id)
-                .map(|&v| v as i64),
-        );
-        self.nan_value_count.append_option(
-            data_file
-                .nan_value_counts()
-                .get(&self.field_id)
-                .map(|&v| v as i64),
-        );
-        match data_file.lower_bounds().get(&self.field_id) {
-            Some(datum) => self
-                .lower_bound
-                .append_datum(get_arrow_datum(datum)?.as_ref())?,
-            None => self.lower_bound.append_null()?,
-        }
-        match data_file.upper_bounds().get(&self.field_id) {
-            Some(datum) => self
-                .upper_bound
-                .append_datum(get_arrow_datum(datum)?.as_ref())?,
-            None => self.upper_bound.append_null()?,
-        }
+    fn append_to_list_field<T: ArrowPrimitiveType>(
+        &mut self,
+        index: usize,
+        values: &[T::Native],
+    ) -> Result<()> {
+        let list_builder = self.field_builder::<ListBuilder<Box<dyn ArrayBuilder>>>(index)?;
+        list_builder
+            .values()
+            .cast_or_err::<PrimitiveBuilder<T>>()?
+            .append_slice(values);
+        list_builder.append(true);
         Ok(())
     }

-    fn finish(&mut self) -> StructArray {
-        let inner_arrays: Vec<ArrayRef> = vec![
-            Arc::new(self.column_size.finish()),
-            Arc::new(self.value_count.finish()),
-            Arc::new(self.null_value_count.finish()),
-            Arc::new(self.nan_value_count.finish()),
-            Arc::new(self.lower_bound.finish()),
-            Arc::new(self.upper_bound.finish()),
-        ];
-
-        StructArray::from(
-            Self::fields(&self.data_type)
-                .into_iter()
-                .cloned()
-                .zip_eq(inner_arrays)
-                .collect::<Vec<_>>(),
-        )
-    }
-}
-
-/// Build a [StructArray] with partition columns as fields and partition values as rows.
-struct PartitionValuesStructBuilder {
-    fields: Fields,
-    builders: Vec<AnyArrayBuilder>,
-}
-
-impl PartitionValuesStructBuilder {
-    /// Construct a new builder from the combined partition columns of the table metadata.
-    fn new(table_metadata: &TableMetadata) -> Self {
-        let combined_fields = Self::combined_partition_fields(table_metadata);
-        Self {
-            builders: combined_fields
-                .iter()
-                .map(|field| AnyArrayBuilder::new(field.data_type()))
-                .collect_vec(),
-            fields: combined_fields,
-        }
+    fn append_to_map_field<K: ArrayBuilder, V: ArrayBuilder>(
+        &mut self,
+        index: usize,
+        key_func: impl Fn(&mut K),
+        value_func: impl Fn(&mut V),
+    ) -> Result<()> {
+        let map_builder =
+            self.field_builder::<MapBuilder<Box<dyn ArrayBuilder>, Box<dyn ArrayBuilder>>>(index)?;
+        key_func(map_builder.keys().cast_or_err::<K>()?);
+        value_func(map_builder.values().cast_or_err::<V>()?);
+        Ok(map_builder.append(true)?)
     }

-    /// Build the combined partition spec union-ing past and current partition specs
-    fn combined_partition_fields(table_metadata: &TableMetadata) -> Fields {
-        let combined_fields: HashMap<i32, &PartitionField> = table_metadata
-            .partition_specs_iter()
-            .flat_map(|spec| spec.fields())
-            .map(|field| (field.field_id, field))
-            .collect();
-
-        combined_fields
-            .into_iter()
-            // Sort by field id to get a deterministic order
-            .sorted_by_key(|(id, _)| *id)
-            .map(|(_, field)| {
-                let source_type = &table_metadata
-                    .current_schema()
-                    .field_by_id(field.source_id)
-                    .unwrap()
-                    .field_type;
-                let result_type = field.transform.result_type(source_type).unwrap();
-                Field::new(
-                    field.name.clone(),
-                    type_to_arrow_type(&result_type).unwrap(),
-                    true,
-                )
-            })
-            .collect()
+    fn append_to_primitive_map_field<K: ArrowPrimitiveType, V: ArrowPrimitiveType>(
+        &mut self,
+        index: usize,
+        keys: &[K::Native],
+        values: &[V::Native],
+    ) -> Result<()> {
+        let map_builder =
+            self.field_builder::<MapBuilder<Box<dyn ArrayBuilder>, Box<dyn ArrayBuilder>>>(index)?;
+        map_builder
+            .keys()
+            .cast_or_err::<PrimitiveBuilder<K>>()?
+            .append_slice(keys);
+        map_builder
+            .values()
+            .cast_or_err::<PrimitiveBuilder<V>>()?
+            .append_slice(values);
+        Ok(map_builder.append(true)?)
     }

-    fn append(
+    fn append_partition_values(
         &mut self,
-        partition_fields: &[PartitionField],
+        partition_spec_id: i32,
         partition_values: &Struct,
     ) -> Result<()> {
-        for (field, value) in partition_fields.iter().zip_eq(partition_values.iter()) {
-            let index = self.find_field(&field.name)?;
-
-            match value {
-                Some(literal) => self.builders[index].append_literal(literal)?,
-                None => self.builders[index].append_null()?,
+        // Get the partition fields for the partition spec id in the manifest file
+        let partition_spec = self
+            .table_metadata
+            .partition_spec_by_id(partition_spec_id)
+            .ok_or_else(|| Error::new(ErrorKind::Unexpected, "Partition spec not found"))?
+            .fields();
+        // Clone here so we don't hold an immutable reference as we mutably borrow the builder below
+        let combined_partition_fields = self.combined_partition_fields.clone();
+        // Get the partition struct builder
+        let partition_builder = self.field_builder::<StructBuilder>(3)?;
+        // Iterate the manifest's partition fields with the respective partition values from the data file
+        for (partition_field, partition_value) in
+            partition_spec.iter().zip_eq(partition_values.iter())
+        {
+            let (combined_index, combined_partition_spec_field) = combined_partition_fields
+                .find(&partition_field.name)
+                .ok_or_else(|| Error::new(ErrorKind::Unexpected, "Partition field not found"))?;
+            let partition_type = combined_partition_spec_field.data_type();
+            let partition_value: Option<PrimitiveLiteral> = partition_value
+                .map(|value| -> std::result::Result<PrimitiveLiteral, Error> {
+                    value.as_primitive_literal().ok_or({
+                        Error::new(
+                            ErrorKind::FeatureUnsupported,
+                            "Only primitive types are supported in partition structs",
+                        )
+                    })
+                })
+                .transpose()?;
+
+            // Append a literal to a field builder, cast based on the expected partition field type.
+            // We cannot solely rely on the literal type, because it doesn't sufficiently specify
+            // the underlying type. E.g., a `PrimitiveLiteral::Long` could represent either a long
+            // or a timestamp.
+            match (partition_type, partition_value.clone()) {
+                (DataType::Boolean, Some(PrimitiveLiteral::Boolean(value))) => partition_builder
+                    .field_builder_or_err::<BooleanBuilder>(combined_index)?
+                    .append_value(value),
+                (DataType::Boolean, None) => partition_builder
+                    .field_builder_or_err::<BooleanBuilder>(combined_index)?
+                    .append_null(),
+                (DataType::Int32, Some(PrimitiveLiteral::Int(value))) => partition_builder
+                    .field_builder_or_err::<Int32Builder>(combined_index)?
+                    .append_value(value),
+                (DataType::Int32, None) => partition_builder
+                    .field_builder_or_err::<Int32Builder>(combined_index)?
+                    .append_null(),
+                (DataType::Int64, Some(PrimitiveLiteral::Long(value))) => partition_builder
+                    .field_builder_or_err::<Int64Builder>(combined_index)?
+                    .append_value(value),
+                (DataType::Int64, None) => partition_builder
+                    .field_builder_or_err::<Int64Builder>(combined_index)?
+                    .append_null(),
+                (DataType::Float32, Some(PrimitiveLiteral::Float(OrderedFloat(value)))) => {
+                    partition_builder
+                        .field_builder_or_err::<Float32Builder>(combined_index)?
+                        .append_value(value)
+                }
+                (DataType::Float32, None) => partition_builder
+                    .field_builder_or_err::<Float32Builder>(combined_index)?
+                    .append_null(),
+                (DataType::Float64, Some(PrimitiveLiteral::Double(OrderedFloat(value)))) => {
+                    partition_builder
+                        .field_builder_or_err::<Float64Builder>(combined_index)?
+                        .append_value(value)
+                }
+                (DataType::Float64, None) => partition_builder
+                    .field_builder_or_err::<Float64Builder>(combined_index)?
+                    .append_null(),
+                (DataType::Utf8, Some(PrimitiveLiteral::String(value))) => partition_builder
+                    .field_builder_or_err::<StringBuilder>(combined_index)?
+                    .append_value(value),
+                (DataType::Utf8, None) => partition_builder
+                    .field_builder_or_err::<StringBuilder>(combined_index)?
+                    .append_null(),
+                (DataType::FixedSizeBinary(_), Some(PrimitiveLiteral::Binary(value))) => {
+                    partition_builder
+                        .field_builder_or_err::<FixedSizeBinaryBuilder>(combined_index)?
+                        .append_value(value)?
+                }
+                (DataType::FixedSizeBinary(_), None) => partition_builder
+                    .field_builder_or_err::<FixedSizeBinaryBuilder>(combined_index)?
+                    .append_null(),
+                (DataType::LargeBinary, Some(PrimitiveLiteral::Binary(value))) => partition_builder
+                    .field_builder_or_err::<LargeBinaryBuilder>(combined_index)?
+                    .append_value(value),
+                (DataType::LargeBinary, None) => partition_builder
+                    .field_builder_or_err::<LargeBinaryBuilder>(combined_index)?
+                    .append_null(),
+                (DataType::Date32, Some(PrimitiveLiteral::Int(value))) => partition_builder
+                    .field_builder_or_err::<Date32Builder>(combined_index)?
+                    .append_value(value),
+                (DataType::Date32, None) => partition_builder
+                    .field_builder_or_err::<Date32Builder>(combined_index)?
+                    .append_null(),
+                (
+                    DataType::Timestamp(TimeUnit::Microsecond, _),
+                    Some(PrimitiveLiteral::Long(value)),
+                ) => partition_builder
+                    .field_builder_or_err::<TimestampMicrosecondBuilder>(combined_index)?
+                    .append_value(value),
+                (DataType::Timestamp(TimeUnit::Microsecond, _), None) => partition_builder
+                    .field_builder_or_err::<TimestampMicrosecondBuilder>(combined_index)?
+                    .append_null(),
+                (
+                    DataType::Timestamp(TimeUnit::Nanosecond, _),
+                    Some(PrimitiveLiteral::Long(value)),
+                ) => partition_builder
+                    .field_builder_or_err::<TimestampNanosecondBuilder>(combined_index)?
+                    .append_value(value),
+                (DataType::Timestamp(TimeUnit::Nanosecond, _), None) => partition_builder
+                    .field_builder_or_err::<TimestampNanosecondBuilder>(combined_index)?
+                    .append_null(),
+                (DataType::Decimal128(_, _), Some(PrimitiveLiteral::Int128(value))) => {
+                    partition_builder
+                        .field_builder_or_err::<Decimal128Builder>(combined_index)?
+                        .append_value(value)
+                }
+                (DataType::Decimal128(_, _), None) => partition_builder
+                    .field_builder_or_err::<Decimal128Builder>(combined_index)?
+                    .append_null(),
+                (_, _) => {
+                    return Err(Error::new(
+                        ErrorKind::FeatureUnsupported,
+                        format!(
+                            "Cannot build partition struct with field type {:?} and partition value {:?}",
+                            partition_type, partition_value
+                        ),
+                    ));
+                }
             }
         }
+
+        // Append an element in the struct
+        partition_builder.append(true);
         Ok(())
     }

     fn finish(&mut self) -> StructArray {
-        let arrays: Vec<ArrayRef> = self
-            .builders
-            .iter_mut()
-            .map::<ArrayRef, _>(|builder| Arc::new(builder.finish()))
-            .collect();
-        StructArray::from(
-            self.fields
-                .iter()
-                .cloned()
-                .zip_eq(arrays)
-                .collect::<Vec<_>>(),
-        )
+        self.struct_builder.finish()
     }
+}

-    fn find_field(&self, name: &str) -> Result<usize> {
-        match self.fields.find(name) {
-            Some((index, _)) => Ok(index),
-            None => Err(Error::new(
-                ErrorKind::Unexpected,
-                format!("Field not found: {}", name),
-            )),
+/// Join two schemas by concatenating fields. Return [`Error`] if the schemas have fields with the
+/// same field id but different types.
+fn join_schemas(left: &Schema, right: &Schema) -> Result<Schema> {
+    let mut joined_fields: Vec<NestedFieldRef> = left.as_struct().fields().to_vec();
+
+    for right_field in right.as_struct().fields() {
+        match left.field_by_id(right_field.id) {
+            None => {
+                joined_fields.push(right_field.clone());
+            }
+            Some(left_field) => {
+                if left_field != right_field {
+                    return Err(Error::new(
+                        ErrorKind::DataInvalid,
+                        format!(
+                            "Schemas have different columns with the same id: {:?}, {:?}",
+                            left_field, right_field
+                        ),
+                    ));
+                }
+            }
         }
     }
-}

-struct ReadableMetricsStructBuilder<'a> {
-    table_schema: &'a SchemaRef,
-    column_builders: Vec<PerColumnReadableMetricsBuilder>,
+    Schema::builder().with_fields(joined_fields).build()
 }

-impl<'a> ReadableMetricsStructBuilder<'a> {
-    /// Helper to construct per-column readable metrics. The metrics are "readable" in that the reported
-    /// and lower and upper bounds are reported as deserialized values.
-    fn fields(table_schema: &SchemaRef) -> Result<Fields> {
-        let arrow_schema = schema_to_arrow_schema(table_schema)?;
-
-        Ok(arrow_schema
-            .fields()
-            .iter()
-            .map(|field| {
-                Field::new(
-                    field.name(),
-                    DataType::Struct(PerColumnReadableMetricsBuilder::fields(field.data_type())),
-                    false,
-                )
-            })
-            .collect_vec()
-            .into())
-    }
+/// Helper to cast a field builder in a [`StructBuilder`] to a specific builder type or return an
+/// [`Error`].
+trait StructBuilderExt {
+    fn field_builder_or_err<T: ArrayBuilder>(&mut self, index: usize) -> Result<&mut T>;
+}

-    fn new(table_schema: &'a SchemaRef) -> Result<Self> {
-        Ok(Self {
-            table_schema,
-            column_builders: table_schema
-                .as_struct()
-                .fields()
-                .iter()
-                .map(|field| {
-                    type_to_arrow_type(&field.field_type).map(|arrow_type| {
-                        PerColumnReadableMetricsBuilder::new_for_field(field.id, &arrow_type)
-                    })
-                })
-                .collect::<Result<Vec<_>>>()?,
+impl StructBuilderExt for StructBuilder {
+    fn field_builder_or_err<T: ArrayBuilder>(&mut self, index: usize) -> Result<&mut T> {
+        self.field_builder::<T>(index).ok_or_else(|| {
+            Error::new(
+                ErrorKind::Unexpected,
+                format!(
+                    "Field builder not found for index {index} and type {}",
+                    type_name::<T>()
+                ),
+            )
         })
     }
+}

-    fn append(&mut self, data_file: &DataFile) -> Result<()> {
-        for column_builder in &mut self.column_builders {
-            column_builder.append(data_file)?;
-        }
-        Ok(())
-    }
+/// Helper to cast a [`Box<dyn ArrayBuilder>`] to a specific type or return an [`Error`].
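+///
+/// Illustrative sketch of the intended use: a `Box<dyn ArrayBuilder>` that was
+/// created as an `Int64Builder` can be recovered via
+/// `builder.cast_or_err::<Int64Builder>()?`; casting to a mismatched builder
+/// type returns an [`Error`] instead of panicking.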
+/// Helper to cast a [`Box<dyn ArrayBuilder>`] to a specific type or return an [`Error`].
+trait ArrayBuilderExt {
+    fn cast_or_err<T: ArrayBuilder>(&mut self) -> Result<&mut T>;
+}
-    fn finish(&mut self) -> StructArray {
-        let fields: Vec<FieldRef> = Self::fields(self.table_schema)
-            // We already checked the schema conversion in the constructor
-            .unwrap()
-            .into_iter()
-            .cloned()
-            .collect();
-        let arrays: Vec<ArrayRef> = self
-            .column_builders
-            .iter_mut()
-            .map::<ArrayRef, _>(|builder| Arc::new(builder.finish()))
-            .collect();
-        StructArray::from(
-            fields
-                .into_iter()
-                .zip_eq(arrays)
-                .collect::<Vec<_>>(),
-        )
-    }
-}
+impl ArrayBuilderExt for Box<dyn ArrayBuilder> {
+    fn cast_or_err<T: ArrayBuilder>(&mut self) -> Result<&mut T> {
+        self.as_any_mut().downcast_mut::<T>().ok_or_else(|| {
+            Error::new(
+                ErrorKind::Unexpected,
+                format!("Cannot cast builder to type {}", type_name::<T>()),
+            )
+        })
+    }
+}
@@ -643,29 +572,32 @@ mod tests {
         let mut fixture = TableTestFixture::new();
         fixture.setup_manifest_files().await;
         let table = fixture.table;
+        let inspect = table.inspect();
+        let entries_table = inspect.entries();
-        let batch_stream = table.inspect().entries().scan().await.unwrap();
+        let batch_stream = entries_table.scan().await.unwrap();
         check_record_batches(
             batch_stream,
             expect![[r#"
-                Field { name: "status", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} },
-                Field { name: "snapshot_id", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
-                Field { name: "sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
-                Field { name: "file_sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} },
-                Field { name: "data_file", data_type: Struct([Field { name: "content", data_type: Int8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_path", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_format", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "partition", data_type: Struct([Field { name: "x", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "record_count", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "file_size_in_bytes", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "column_sizes", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_counts", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_counts", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false,
metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_counts", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bounds", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bounds", data_type: Map(Field { name: "entries", data_type: Struct([Field { name: "keys", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "values", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "key_metadata", data_type: Binary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "split_offsets", data_type: List(Field { name: "item", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "equality_ids", data_type: List(Field { name: "item", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "sort_order_id", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, - Field { name: "readable_metrics", data_type: Struct([Field { name: "x", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "y", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: 
"null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "z", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "a", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "dbl", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "i32", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: 
false, metadata: {} }, Field { name: "upper_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "i64", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "bool", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "float", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "decimal", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "date", data_type: Struct([Field { name: 
"column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamp", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamptz", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestampns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "timestamptzns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: 
"value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "binary", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "lower_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }, Field { name: "upper_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }"#]], + Field { name: "status", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "0"} }, + Field { name: "snapshot_id", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1"} }, + Field { name: "sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "3"} }, + Field { name: "file_sequence_number", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "4"} }, + Field { name: "data_file", data_type: Struct([Field { name: "content", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "134"} }, Field { name: "file_path", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "100"} }, Field { name: "file_format", data_type: Utf8, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "101"} }, Field { name: "partition", data_type: Struct([Field { name: "x", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1000"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "102"} }, Field { name: "record_count", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "103"} }, Field { name: "file_size_in_bytes", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "104"} }, Field { name: "column_sizes", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "117"} }, Field { name: "value", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": 
"118"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "108"} }, Field { name: "value_counts", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "119"} }, Field { name: "value", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "120"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "109"} }, Field { name: "null_value_counts", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "121"} }, Field { name: "value", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "122"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "110"} }, Field { name: "nan_value_counts", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "138"} }, Field { name: "value", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "139"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "137"} }, Field { name: "lower_bounds", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "126"} }, Field { name: "value", data_type: LargeBinary, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "127"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "125"} }, Field { name: "upper_bounds", data_type: Map(Field { name: "key_value", data_type: Struct([Field { name: "key", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "129"} }, Field { name: "value", data_type: LargeBinary, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "130"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {} }, false), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "128"} }, Field { name: "key_metadata", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "131"} }, Field { name: "split_offsets", data_type: List(Field { name: "element", data_type: Int64, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "133"} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "132"} }, Field { name: "equality_ids", data_type: List(Field { name: "element", data_type: Int32, nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "136"} }), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": 
"135"} }, Field { name: "sort_order_id", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "140"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "2"} }, + Field { name: "readable_metrics", data_type: Struct([Field { name: "a", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1001"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1002"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1003"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1004"} }, Field { name: "lower_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1005"} }, Field { name: "upper_bound", data_type: Utf8, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1006"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1007"} }, Field { name: "binary", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1008"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1009"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1010"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1011"} }, Field { name: "lower_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1012"} }, Field { name: "upper_bound", data_type: LargeBinary, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1013"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1014"} }, Field { name: "bool", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1015"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1016"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1017"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1018"} }, Field { name: "lower_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1019"} }, Field { name: "upper_bound", data_type: Boolean, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1020"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1021"} }, Field { name: "date", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1022"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, 
dict_is_ordered: false, metadata: {"PARQUET:field_id": "1023"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1024"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1025"} }, Field { name: "lower_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1026"} }, Field { name: "upper_bound", data_type: Date32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1027"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1028"} }, Field { name: "dbl", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1029"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1030"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1031"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1032"} }, Field { name: "lower_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1033"} }, Field { name: "upper_bound", data_type: Float64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1034"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1035"} }, Field { name: "decimal", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1036"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1037"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1038"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1039"} }, Field { name: "lower_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1040"} }, Field { name: "upper_bound", data_type: Decimal128(3, 2), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1041"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1042"} }, Field { name: "float", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1043"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1044"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1045"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1046"} }, Field { name: "lower_bound", data_type: Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1047"} }, Field { name: "upper_bound", data_type: 
Float32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1048"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1049"} }, Field { name: "i32", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1050"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1051"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1052"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1053"} }, Field { name: "lower_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1054"} }, Field { name: "upper_bound", data_type: Int32, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1055"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1056"} }, Field { name: "i64", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1057"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1058"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1059"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1060"} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1061"} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1062"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1063"} }, Field { name: "timestamp", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1064"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1065"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1066"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1067"} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1068"} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1069"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1070"} }, Field { name: "timestampns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1071"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1072"} 
}, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1073"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1074"} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1075"} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, None), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1076"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1077"} }, Field { name: "timestamptz", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1078"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1079"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1080"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1081"} }, Field { name: "lower_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1082"} }, Field { name: "upper_bound", data_type: Timestamp(Microsecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1083"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1084"} }, Field { name: "timestamptzns", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1085"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1086"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1087"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1088"} }, Field { name: "lower_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1089"} }, Field { name: "upper_bound", data_type: Timestamp(Nanosecond, Some("+00:00")), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1090"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1091"} }, Field { name: "x", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1092"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1093"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1094"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1095"} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: 
false, metadata: {"PARQUET:field_id": "1096"} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1097"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1098"} }, Field { name: "y", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1099"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1100"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1101"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1102"} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1103"} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1104"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1105"} }, Field { name: "z", data_type: Struct([Field { name: "column_size", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1106"} }, Field { name: "value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1107"} }, Field { name: "null_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1108"} }, Field { name: "nan_value_count", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1109"} }, Field { name: "lower_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1110"} }, Field { name: "upper_bound", data_type: Int64, nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1111"} }]), nullable: false, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1112"} }]), nullable: true, dict_id: 0, dict_is_ordered: false, metadata: {"PARQUET:field_id": "1113"} }"#]], expect![[r#" 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+ | status | snapshot_id | sequence_number | file_sequence_number | data_file | readable_metrics | 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+ - | 1 | 3055729675574597004 | 1 | 1 | {content: 0, file_format: PARQUET, partition: {x: 100}, record_count: 1, file_size_in_bytes: 100, column_sizes: {1: 1, 2: 1}, value_counts: {1: 2, 2: 2}, null_value_counts: {1: 3, 2: 3}, nan_value_counts: {1: 4, 2: 4}, lower_bounds: {1: 0100000000000000, 2: 0200000000000000, 3: 0300000000000000, 4: 417061636865, 5: 0000000000005940, 6: 64000000, 7: 6400000000000000, 8: 00, 9: 0000c842, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, upper_bounds: {1: 0100000000000000, 2: 0500000000000000, 3: 0400000000000000, 4: 49636562657267, 5: 0000000000006940, 6: c8000000, 7: c800000000000000, 8: 01, 9: 00004843, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: 1, value_count: 2, 
null_value_count: 3, nan_value_count: 4, lower_bound: 1, upper_bound: 1}, y: {column_size: 1, value_count: 2, null_value_count: 3, nan_value_count: 4, lower_bound: 2, upper_bound: 5}, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 3, upper_bound: 4}, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: Apache, upper_bound: Iceberg}, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: false, upper_bound: true}, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01, upper_bound: 1970-01-01}, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00, upper_bound: 1970-01-01T00:00:00}, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00Z, upper_bound: 1970-01-01T00:00:00Z}, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | - | 2 | 3055729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 200}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , 
lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | - | 0 | 3051729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 300}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | + | 1 | 3055729675574597004 | 1 | 1 | {content: 0, file_format: PARQUET, partition: {x: 100}, record_count: 1, file_size_in_bytes: 100, column_sizes: {1: 1, 2: 1}, value_counts: {1: 2, 2: 2}, null_value_counts: {1: 3, 2: 3}, nan_value_counts: {1: 4, 2: 4}, lower_bounds: {1: 0100000000000000, 2: 0200000000000000, 3: 0300000000000000, 4: 417061636865, 5: 0000000000005940, 6: 64000000, 7: 6400000000000000, 8: 00, 9: 0000c842, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, upper_bounds: {1: 0100000000000000, 2: 0500000000000000, 3: 0400000000000000, 4: 49636562657267, 5: 0000000000006940, 6: c8000000, 7: c800000000000000, 8: 01, 9: 00004843, 11: 00000000, 12: 0000000000000000, 13: 0000000000000000}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: Apache, upper_bound: Iceberg}, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: false, 
upper_bound: true}, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01, upper_bound: 1970-01-01}, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100.0, upper_bound: 200.0}, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 100, upper_bound: 200}, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00, upper_bound: 1970-01-01T00:00:00}, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 1970-01-01T00:00:00Z, upper_bound: 1970-01-01T00:00:00Z}, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, x: {column_size: 1, value_count: 2, null_value_count: 3, nan_value_count: 4, lower_bound: 1, upper_bound: 1}, y: {column_size: 1, value_count: 2, null_value_count: 3, nan_value_count: 4, lower_bound: 2, upper_bound: 5}, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: 3, upper_bound: 4}} | + | 2 | 3055729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 200}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , 
value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | + | 0 | 3051729675574597004 | 0 | 0 | {content: 0, file_format: PARQUET, partition: {x: 300}, record_count: 1, file_size_in_bytes: 100, column_sizes: {}, value_counts: {}, null_value_counts: {}, nan_value_counts: {}, lower_bounds: {}, upper_bounds: {}, key_metadata: , split_offsets: [], equality_ids: [], sort_order_id: } | {a: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, binary: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, bool: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, date: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, dbl: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, decimal: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, float: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i32: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, i64: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamp: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestampns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptz: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, timestamptzns: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, x: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, y: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }, z: {column_size: , value_count: , null_value_count: , nan_value_count: , lower_bound: , upper_bound: }} | 
+--------+---------------------+-----------------+----------------------+------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------+"#]], &[], &["file_path"], None, - ).await; + ) + .await; } } diff --git a/crates/iceberg/src/inspect/metadata_table.rs b/crates/iceberg/src/inspect/metadata_table.rs index 3ea029cf3..20d75caa9 100644 --- a/crates/iceberg/src/inspect/metadata_table.rs +++ b/crates/iceberg/src/inspect/metadata_table.rs @@ -56,7 +56,7 @@ pub mod tests { use arrow_array::{ArrayRef, RecordBatch, StructArray}; use arrow_cast::pretty::pretty_format_batches; - use arrow_schema::{DataType, Field, FieldRef, Schema}; + use arrow_schema::{DataType, Field, FieldRef, Schema as ArrowSchema}; use expect_test::Expect; use futures::TryStreamExt; use itertools::Itertools; @@ -133,9 +133,11 @@ pub mod tests { record_batch.schema().fields().iter().format(",\n") )); expected_data.assert_eq( - &pretty_format_batches(&[ - 
RecordBatch::try_new(Arc::new(Schema::new(fields)), columns).unwrap()
-            ])
+            &pretty_format_batches(&[RecordBatch::try_new(
+                Arc::new(ArrowSchema::new(fields)),
+                columns,
+            )
+            .unwrap()])
             .unwrap()
             .to_string(),
         );
diff --git a/crates/iceberg/src/inspect/metrics.rs b/crates/iceberg/src/inspect/metrics.rs
new file mode 100644
index 000000000..ee0d37378
--- /dev/null
+++ b/crates/iceberg/src/inspect/metrics.rs
@@ -0,0 +1,428 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::any::type_name;
+use std::sync::Arc;
+
+use arrow_array::builder::{
+    ArrayBuilder, BooleanBuilder, Date32Builder, Decimal128Builder, FixedSizeBinaryBuilder,
+    Float32Builder, Float64Builder, Int32Builder, Int64Builder, LargeBinaryBuilder, StringBuilder,
+    StructBuilder, TimestampMicrosecondBuilder, TimestampNanosecondBuilder,
+};
+use arrow_array::cast::AsArray;
+use arrow_array::types::{
+    Date32Type, Decimal128Type, Float32Type, Float64Type, Int32Type, Int64Type,
+    TimestampMicrosecondType, TimestampNanosecondType,
+};
+use arrow_array::{ArrayRef, StructArray};
+use arrow_schema::{DataType, FieldRef, Fields};
+use itertools::Itertools;
+use rust_decimal::prelude::ToPrimitive;
+
+use crate::arrow::{get_arrow_datum, schema_to_arrow_schema, type_to_arrow_type};
+use crate::spec::{
+    DataFile, Datum, NestedField, NestedFieldRef, PrimitiveType, Schema, StructType, Type,
+};
+use crate::{Error, ErrorKind, Result};
+
+/// Metrics for a column in a data file.
+struct ColumnMetrics {
+    column_size: Option<i64>,
+    value_count: Option<i64>,
+    null_value_count: Option<i64>,
+    nan_value_count: Option<i64>,
+    lower_bound: Option<Datum>,
+    upper_bound: Option<Datum>,
+}
+
+/// Builder for the `readable_metrics` struct in metadata tables.
+pub(crate) struct ReadableMetricsStructBuilder {
+    column_builders: Vec<ReadableColumnMetricsStructBuilder>,
+    column_fields: Fields,
+}
+
+impl ReadableMetricsStructBuilder {
+    /// Calculates a dynamic schema for `readable_metrics` to add to metadata tables. The type
+    /// will be a nested struct containing all primitive columns in the data table. Within the
+    /// struct's fields are structs that represent [`ColumnMetrics`].
+    ///
+    /// We take the table's schema to get the set of fields in the table. We also take the
+    /// manifest entry schema to get the highest field ID in the entries metadata table, so we
+    /// know which field ID to begin with.
+    pub fn readable_metrics_schema(
+        data_table_schema: &Schema,
+        manifest_entry_schema: &Schema,
+    ) -> Result<Schema> {
+        let mut field_ids = IncrementingFieldId(manifest_entry_schema.highest_field_id() + 1);
+        let mut column_metrics_fields: Vec<NestedFieldRef> = Vec::new();
+
+        let mut primitive_fields: Vec<&NestedFieldRef> = data_table_schema
+            .as_struct()
+            .fields()
+            .iter()
+            .filter(|field| field.field_type.is_primitive())
+            .collect_vec();
+        primitive_fields.sort_by_key(|field| field.name.clone());
+
+        for field in primitive_fields {
+            // We can expect a primitive type because we filtered for primitive fields above
+            let primitive_type = field.field_type.as_primitive_type().expect("is primitive");
+            let metrics_schema_for_field =
+                ReadableColumnMetricsStructBuilder::schema(&mut field_ids, primitive_type)?;
+
+            column_metrics_fields.push(Arc::new(NestedField::required(
+                field_ids.next_id(),
+                &field.name,
+                Type::Struct(metrics_schema_for_field.as_struct().clone()),
+            )));
+        }
+
+        Schema::builder()
+            .with_fields(vec![Arc::new(NestedField::optional(
+                field_ids.next_id(),
+                "readable_metrics",
+                Type::Struct(StructType::new(column_metrics_fields)),
+            ))])
+            .build()
+    }
+
+    /// Takes a table schema and a readable metrics schema built by
+    /// [`Self::readable_metrics_schema`].
+    pub fn new(
+        data_table_schema: &Schema,
+        readable_metrics_schema: &StructType,
+    ) -> Result<Self> {
+        let DataType::Struct(column_fields) =
+            type_to_arrow_type(&Type::Struct(readable_metrics_schema.clone()))?
+        else {
+            return Err(Error::new(
+                ErrorKind::Unexpected,
+                "Converted Arrow type was not struct",
+            ));
+        };
+
+        let column_builders = readable_metrics_schema
+            .fields()
+            .iter()
+            .map(|column_metrics_field| {
+                let fields = column_metrics_field
+                    .field_type
+                    .clone()
+                    .to_struct_type()
+                    .ok_or_else(|| Error::new(ErrorKind::DataInvalid, "Expected struct type"))?
+                    .fields()
+                    .iter()
+                    .cloned()
+                    .collect_vec();
+                let column_metrics_schema = Schema::builder().with_fields(fields).build()?;
+                let data_field = data_table_schema
+                    .field_by_name(&column_metrics_field.name)
+                    .ok_or_else(|| {
+                        Error::new(
+                            ErrorKind::DataInvalid,
+                            format!(
+                                "{} in readable metrics schema does not exist in table",
+                                &column_metrics_field.name
+                            ),
+                        )
+                    })?;
+                let primitive_type = data_field
+                    .field_type
+                    .as_primitive_type()
+                    .ok_or_else(|| {
+                        Error::new(
+                            ErrorKind::FeatureUnsupported,
+                            "Readable metrics only supported for primitive types",
+                        )
+                    })?
+                    .clone();
+
+                ReadableColumnMetricsStructBuilder::new(
+                    data_field.id,
+                    primitive_type,
+                    column_metrics_schema,
+                )
+            })
+            .collect::<Result<Vec<_>>>()?;
+
+        Ok(Self {
+            column_fields,
+            column_builders,
+        })
+    }
+
+    pub fn append(&mut self, data_file: &DataFile) -> Result<()> {
+        for column_builder in &mut self.column_builders {
+            column_builder.append_data_file(data_file)?;
+        }
+        Ok(())
+    }
+
+    pub fn finish(&mut self) -> StructArray {
+        let arrays: Vec<ArrayRef> = self
+            .column_builders
+            .iter_mut()
+            .map::<ArrayRef, _>(|builder| Arc::new(builder.finish()))
+            .collect();
+
+        let inner_arrays: Vec<(FieldRef, ArrayRef)> = self
+            .column_fields
+            .into_iter()
+            .cloned()
+            .zip_eq(arrays)
+            .collect_vec();
+
+        StructArray::from(inner_arrays)
+    }
+}
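For orientation, the intended call pattern for this builder, as a minimal sketch. The names `table_schema`, `entry_schema`, and `data_files` are illustrative and assumed to be in scope; error handling is elided.

    // Sketch only: drive ReadableMetricsStructBuilder end to end.
    let metrics_schema =
        ReadableMetricsStructBuilder::readable_metrics_schema(table_schema, entry_schema)?;
    let struct_type = metrics_schema
        .field_by_name("readable_metrics")
        .expect("field was just built")
        .field_type
        .clone()
        .to_struct_type()
        .expect("readable_metrics is a struct");
    let mut builder = ReadableMetricsStructBuilder::new(table_schema, &struct_type)?;
    for data_file in &data_files {
        builder.append(data_file)?; // one row of per-column metrics per data file
    }
    let readable_metrics: StructArray = builder.finish();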
+struct ReadableColumnMetricsStructBuilder {
+    /// Field id of the column in the data table.
+    field_id: i32,
+    /// Type of the column in the data table for which these are the metrics.
+    primitive_type: PrimitiveType,
+    /// The struct builder for this column's readable metrics.
+    struct_builder: StructBuilder,
+}
+
+/// Builds a readable metrics struct for a single column.
+///
+/// For reference, see [Java][1] and [Python][2] implementations.
+///
+/// [1]: https://github.com/apache/iceberg/blob/4a432839233f2343a9eae8255532f911f06358ef/core/src/main/java/org/apache/iceberg/MetricsUtil.java#L337
+/// [2]: https://github.com/apache/iceberg-python/blob/a051584a3684392d2db6556449eb299145d47d15/pyiceberg/table/inspect.py#L101-L110
+impl ReadableColumnMetricsStructBuilder {
+    /// Return the readable metrics schema for a column of the given data type.
+    fn schema(field_ids: &mut IncrementingFieldId, data_type: &PrimitiveType) -> Result<Schema> {
+        Schema::builder()
+            .with_fields(vec![
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "column_size",
+                    Type::Primitive(PrimitiveType::Long),
+                )),
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "value_count",
+                    Type::Primitive(PrimitiveType::Long),
+                )),
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "null_value_count",
+                    Type::Primitive(PrimitiveType::Long),
+                )),
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "nan_value_count",
+                    Type::Primitive(PrimitiveType::Long),
+                )),
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "lower_bound",
+                    Type::Primitive(data_type.clone()),
+                )),
+                Arc::new(NestedField::optional(
+                    field_ids.next_id(),
+                    "upper_bound",
+                    Type::Primitive(data_type.clone()),
+                )),
+            ])
+            .build()
+    }
+
+    fn new(field_id: i32, primitive_type: PrimitiveType, schema: Schema) -> Result<Self> {
+        Ok(Self {
+            field_id,
+            primitive_type,
+            struct_builder: StructBuilder::from_fields(schema_to_arrow_schema(&schema)?.fields, 0),
+        })
+    }
+
+    fn append_data_file(&mut self, data_file: &DataFile) -> Result<()> {
+        let column_metrics = Self::get_column_metrics_from_data_file(&self.field_id, data_file);
+        self.append_column_metrics(column_metrics)
+    }
+
+    fn get_column_metrics_from_data_file(field_id: &i32, data_file: &DataFile) -> ColumnMetrics {
+        ColumnMetrics {
+            column_size: data_file.column_sizes().get(field_id).map(|&v| v as i64),
+            value_count: data_file.value_counts().get(field_id).map(|&v| v as i64),
+            null_value_count: data_file
+                .null_value_counts()
+                .get(field_id)
+                .map(|&v| v as i64),
+            nan_value_count: data_file
+                .nan_value_counts()
+                .get(field_id)
+                .map(|&v| v as i64),
+            lower_bound: data_file.lower_bounds().get(field_id).cloned(),
+            upper_bound: data_file.upper_bounds().get(field_id).cloned(),
+        }
+    }
+
+    fn append_column_metrics(&mut self, column_metrics: ColumnMetrics) -> Result<()> {
+        let ColumnMetrics {
+            column_size,
+            value_count,
+            null_value_count,
+            nan_value_count,
+            lower_bound,
+            upper_bound,
+        } = column_metrics;
+
+        self.field_builder::<Int64Builder>(0)
+            .append_option(column_size);
+        self.field_builder::<Int64Builder>(1)
+            .append_option(value_count);
+        self.field_builder::<Int64Builder>(2)
+            .append_option(null_value_count);
+        self.field_builder::<Int64Builder>(3)
+            .append_option(nan_value_count);
+        self.append_bounds(4, lower_bound)?;
+        self.append_bounds(5, upper_bound)?;
+        self.struct_builder.append(true);
+        Ok(())
+    }
+
+    fn append_bounds(&mut self, index: usize, datum: Option<Datum>) -> Result<()> {
+        let datum = datum.map(|datum| get_arrow_datum(&datum)).transpose()?;
+        let array = if let Some(datum) = &datum {
+            let (array, is_scalar) = datum.get();
+            if is_scalar {
+                Some(array)
+            } else {
+                return Err(Error::new(
+                    ErrorKind::Unexpected,
+                    "Can only append scalar datum",
+                ));
+            }
+        } else {
+            None
+        };
+
+        match self.primitive_type {
+            PrimitiveType::Boolean => {
+                self.field_builder::<BooleanBuilder>(index)
+                    .append_option(array.map(|array| array.as_boolean().value(0)));
+            }
+            PrimitiveType::Int => {
+                self.field_builder::<Int32Builder>(index)
+                    .append_option(array.map(|array| array.as_primitive::<Int32Type>().value(0)));
+            }
+            PrimitiveType::Long => {
+                self.field_builder::<Int64Builder>(index)
+                    .append_option(array.map(|array| array.as_primitive::<Int64Type>().value(0)));
+            }
+            PrimitiveType::Float => {
+                self.field_builder::<Float32Builder>(index)
+                    .append_option(array.map(|array| array.as_primitive::<Float32Type>().value(0)));
+            }
+            PrimitiveType::Double => {
+                self.field_builder::<Float64Builder>(index)
+                    .append_option(array.map(|array| array.as_primitive::<Float64Type>().value(0)));
+            }
+            PrimitiveType::Date => {
+                self.field_builder::<Date32Builder>(index)
+                    .append_option(array.map(|array| array.as_primitive::<Date32Type>().value(0)));
+            }
+            PrimitiveType::Time | PrimitiveType::Timestamp | PrimitiveType::Timestamptz => {
+                self.field_builder::<TimestampMicrosecondBuilder>(index)
+                    .append_option(
+                        array
+                            .map(|array| array.as_primitive::<TimestampMicrosecondType>().value(0)),
+                    );
+            }
+            PrimitiveType::TimestampNs | PrimitiveType::TimestamptzNs => {
+                self.field_builder::<TimestampNanosecondBuilder>(index)
+                    .append_option(
+                        array.map(|array| array.as_primitive::<TimestampNanosecondType>().value(0)),
+                    );
+            }
+            PrimitiveType::String => {
+                self.field_builder::<StringBuilder>(index)
+                    .append_option(array.map(|array| array.as_string::<i32>().value(0)));
+            }
+            PrimitiveType::Binary => {
+                self.field_builder::<LargeBinaryBuilder>(index)
+                    .append_option(array.map(|array| array.as_binary::<i64>().value(0)));
+            }
+            PrimitiveType::Decimal { .. } => {
+                self.field_builder::<Decimal128Builder>(index)
+                    .append_option(
+                        array.map(|array| array.as_primitive::<Decimal128Type>().value(0)),
+                    );
+            }
+            PrimitiveType::Fixed(len) => {
+                if len.to_i32().is_some() {
+                    let builder = self.field_builder::<FixedSizeBinaryBuilder>(index);
+                    // FixedSizeBinaryBuilder does not have append_option
+                    match array {
+                        Some(array) => {
+                            builder.append_value(array.as_fixed_size_binary().value(0))?;
+                        }
+                        None => {
+                            builder.append_null();
+                        }
+                    }
+                } else {
+                    self.field_builder::<LargeBinaryBuilder>(index)
+                        .append_option(array.map(|array| array.as_binary::<i64>().value(0)));
+                }
+            }
+            PrimitiveType::Uuid => {
+                let builder = self.field_builder::<FixedSizeBinaryBuilder>(index);
+                // FixedSizeBinaryBuilder does not have append_option
+                match array {
+                    Some(array) => {
+                        builder.append_value(array.as_fixed_size_binary().value(0))?;
+                    }
+                    None => {
+                        builder.append_null();
+                    }
+                }
+            }
+        };
+        Ok(())
+    }
+
+    fn finish(&mut self) -> StructArray {
+        self.struct_builder.finish()
+    }
+
+    // Shorthand to select a field builder with a specific type.
+    fn field_builder<T: ArrayBuilder>(&mut self, index: usize) -> &mut T {
+        match self.struct_builder.field_builder::<T>(index) {
+            Some(builder) => builder,
+            None => panic!(
+                "Field builder not found for index {index} and type {}",
+                type_name::<T>(),
+            ),
+        }
+    }
+}
+
+/// Helper to serve increment field ids.
+struct IncrementingFieldId(i32);
+
+impl IncrementingFieldId {
+    fn next_id(&mut self) -> i32 {
+        let current = self.0;
+        self.0 += 1;
+        current
+    }
+}
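To make the dynamic schema concrete: for each primitive column, `schema` above yields the six-field metrics struct, with ids handed out by `IncrementingFieldId`. A sketch of the result for a string column named `name`; the starting id is illustrative, since in practice it comes from the entries schema's highest field id.

    // Sketch only: shape of `readable_metrics` for one string column.
    //
    // readable_metrics: struct {
    //   name: struct {
    //     column_size: long,
    //     value_count: long,
    //     null_value_count: long,
    //     nan_value_count: long,
    //     lower_bound: string, // bound fields take the data column's type
    //     upper_bound: string,
    //   }
    // }
    let mut ids = IncrementingFieldId(100); // illustrative starting id
    let column_schema =
        ReadableColumnMetricsStructBuilder::schema(&mut ids, &PrimitiveType::String)?;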
diff --git a/crates/iceberg/src/inspect/mod.rs b/crates/iceberg/src/inspect/mod.rs
index 02a57e664..5e3f15d56 100644
--- a/crates/iceberg/src/inspect/mod.rs
+++ b/crates/iceberg/src/inspect/mod.rs
@@ -20,6 +20,7 @@
 mod entries;
 mod manifests;
 mod metadata_table;
+mod metrics;
 mod snapshots;
 
 pub use entries::EntriesTable;
diff --git a/crates/iceberg/src/spec/manifest.rs b/crates/iceberg/src/spec/manifest.rs
index b47591e88..4f5f5e299 100644
--- a/crates/iceberg/src/spec/manifest.rs
+++ b/crates/iceberg/src/spec/manifest.rs
@@ -561,7 +561,7 @@ impl ManifestWriter {
 }
 
 /// This is a helper module that defines the schema field of the manifest list entry.
-mod _const_schema {
+pub(crate) mod _const_schema {
     use std::sync::Arc;
 
     use apache_avro::Schema as AvroSchema;
@@ -862,7 +862,7 @@ mod _const_schema {
         })
     };
 
-    fn data_file_fields_v2(partition_type: &StructType) -> Vec<NestedFieldRef> {
+    pub(crate) fn data_file_fields_v2(partition_type: &StructType) -> Vec<NestedFieldRef> {
         vec![
             CONTENT.clone(),
             FILE_PATH.clone(),
@@ -894,8 +894,8 @@ mod _const_schema {
         schema_to_avro_schema("data_file", &schema)
     }
 
-    pub(super) fn manifest_schema_v2(partition_type: &StructType) -> Result<AvroSchema> {
-        let fields = vec![
+    pub(crate) fn manifest_schema_fields_v2(partition_type: &StructType) -> Vec<NestedFieldRef> {
+        vec![
             STATUS.clone(),
             SNAPSHOT_ID_V2.clone(),
             SEQUENCE_NUMBER.clone(),
@@ -905,8 +905,13 @@ mod _const_schema {
                 "data_file",
                 Type::Struct(StructType::new(data_file_fields_v2(partition_type))),
             )),
-        ];
-        let schema = Schema::builder().with_fields(fields).build()?;
+        ]
+    }
+
+    pub(super) fn manifest_schema_v2(partition_type: &StructType) -> Result<AvroSchema> {
+        let schema = Schema::builder()
+            .with_fields(manifest_schema_fields_v2(partition_type))
+            .build()?;
         schema_to_avro_schema("manifest_entry", &schema)
     }
 
@@ -941,8 +946,8 @@ mod _const_schema {
         schema_to_avro_schema("data_file", &schema)
     }
 
-    pub(super) fn manifest_schema_v1(partition_type: &StructType) -> Result<AvroSchema> {
-        let fields = vec![
+    fn manifest_schema_fields_v1(partition_type: &StructType) -> Vec<NestedFieldRef> {
+        vec![
             STATUS.clone(),
             SNAPSHOT_ID_V1.clone(),
             Arc::new(NestedField::required(
@@ -950,8 +955,13 @@ mod _const_schema {
                 "data_file",
                 Type::Struct(StructType::new(data_file_fields_v1(partition_type))),
            )),
-        ];
-        let schema = Schema::builder().with_fields(fields).build()?;
+        ]
+    }
+
+    pub(super) fn manifest_schema_v1(partition_type: &StructType) -> Result<AvroSchema> {
+        let schema = Schema::builder()
+            .with_fields(manifest_schema_fields_v1(partition_type))
+            .build()?;
         schema_to_avro_schema("manifest_entry", &schema)
     }
 }
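Exposing `manifest_schema_fields_v2` lets the entries metadata table assemble its schema from the same field definitions rather than redeclaring them. A hypothetical sketch of that consumer; `partition_struct` and `readable_metrics` are illustrative locals, not names from this patch.

    // Hypothetical sketch: compose an entries-style schema from the shared
    // manifest-entry fields plus the computed `readable_metrics` field.
    let mut fields = _const_schema::manifest_schema_fields_v2(&partition_struct);
    fields.extend(readable_metrics.as_struct().fields().iter().cloned());
    let entries_schema = Schema::builder().with_fields(fields).build()?;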
diff --git a/crates/iceberg/src/spec/partition.rs b/crates/iceberg/src/spec/partition.rs
index e6405be4c..b2c7fdd50 100644
--- a/crates/iceberg/src/spec/partition.rs
+++ b/crates/iceberg/src/spec/partition.rs
@@ -18,13 +18,16 @@
 /*!
  * Partitioning
  */
+
+use std::collections::{HashMap, HashSet};
 use std::sync::Arc;
 
+use itertools::Itertools;
 use serde::{Deserialize, Serialize};
 use typed_builder::TypedBuilder;
 
 use super::transform::Transform;
-use super::{NestedField, Schema, SchemaRef, StructType};
+use super::{NestedField, Schema, SchemaRef, StructType, TableMetadata, Type};
 use crate::{Error, ErrorKind, Result};
 
 pub(crate) const UNPARTITIONED_LAST_ASSIGNED_ID: i32 = 999;
@@ -616,12 +619,12 @@ trait CorePartitionSpecValidator {
 
         if let Some(collision) = collision {
             Err(Error::new(
-                ErrorKind::DataInvalid,
-                format!(
-                    "Cannot add redundant partition with source id `{}` and transform `{}`. A partition with the same source id and transform already exists with name `{}`",
-                    source_id, transform.dedup_name(), collision.name
-                ),
-            ))
+            ErrorKind::DataInvalid,
+            format!(
+                "Cannot add redundant partition with source id `{}` and transform `{}`. A partition with the same source id and transform already exists with name `{}`",
+                source_id, transform.dedup_name(), collision.name
+            ),
+        ))
         } else {
             Ok(())
         }
@@ -657,10 +660,130 @@ impl CorePartitionSpecValidator for UnboundPartitionSpecBuilder {
     }
 }
 
+/// Builds a unified partition type considering all specs in the table.
+///
+/// Based on Iceberg Java's [`Partitioning#partitionType`][1].
+///
+/// [1]: https://github.com/apache/iceberg/blob/7e0cd3fa1e51d3c80f6c8cff23a03dca86f942fa/core/src/main/java/org/apache/iceberg/Partitioning.java#L240
+pub(crate) fn partition_type(table_metadata: &TableMetadata) -> Result<StructType> {
+    let partition_specs = table_metadata.partition_specs_iter().cloned().collect_vec();
+    let all_field_ids = all_field_ids(&partition_specs);
+
+    build_partition_projection_type(
+        table_metadata.current_schema(),
+        partition_specs,
+        all_field_ids,
+    )
+}
+
+// Based on Iceberg Java's [`Partitioning#buildPartitionProjectionType`][1].
+//
+// [1]: https://github.com/apache/iceberg/blob/apache-iceberg-1.8.0/core/src/main/java/org/apache/iceberg/Partitioning.java#L255
+fn build_partition_projection_type(
+    schema: &Schema,
+    specs: Vec<PartitionSpecRef>,
+    projected_field_ids: HashSet<i32>,
+) -> Result<StructType> {
+    // Check for unknown transforms because we cannot know the output type
+    for spec in &specs {
+        for field in &spec.fields {
+            if field.transform == Transform::Unknown {
+                return Err(Error::new(
+                    ErrorKind::DataInvalid,
+                    format!("Unknown transform in partition spec: {field:?}"),
+                ));
+            }
+        }
+    }
+
+    let mut field_map: HashMap<i32, PartitionField> = HashMap::new();
+    let mut type_map: HashMap<i32, Type> = HashMap::new();
+    let mut name_map: HashMap<i32, String> = HashMap::new();
+
+    // Sort specs by ID in descending order to get the latest field names
+    let sorted_specs = specs
+        .iter()
+        .sorted_by_key(|spec| spec.spec_id())
+        .rev()
+        .collect_vec();
+
+    for spec in sorted_specs {
+        for field in spec.fields() {
+            let field_id = field.field_id;
+
+            if !projected_field_ids.contains(&field_id) {
+                continue;
+            }
+
+            let partition_type = spec.partition_type(schema)?;
+            let struct_field = partition_type.field_by_id(field_id).unwrap();
+            let existing_field = field_map.get(&field_id);
+
+            match existing_field {
+                None => {
+                    field_map.insert(field_id, field.clone());
+                    type_map.insert(field_id, struct_field.field_type.as_ref().clone());
+                    name_map.insert(field_id, struct_field.name.clone());
+                }
+                Some(existing_field) => {
+                    // Verify the fields are compatible, as they may conflict in v1 tables
+                    if !equivalent_ignoring_name(existing_field, field) {
+                        return Err(Error::new(
+                            ErrorKind::DataInvalid,
+                            format!(
+                                "Conflicting partition fields: ['{existing_field:?}', '{field:?}']"
+                            ),
+                        ));
+                    }
+
+                    // Use the correct type for dropped partitions in v1 tables
+                    if is_void_transform(existing_field) && !is_void_transform(field) {
+                        field_map.insert(field_id, field.clone());
+                        type_map.insert(field_id, struct_field.field_type.as_ref().clone());
+                    }
+                }
+            }
+        }
+    }
+
+    let sorted_struct_fields = field_map
+        .into_keys()
+        .sorted()
+        .map(|field_id| {
+            NestedField::optional(field_id, &name_map[&field_id], type_map[&field_id].clone())
+        })
+        .map(Arc::new)
+        .collect_vec();
+
+    Ok(StructType::new(sorted_struct_fields))
+}
+
+fn is_void_transform(field: &PartitionField) -> bool {
+    field.transform == Transform::Void
+}
+
+fn equivalent_ignoring_name(field: &PartitionField, another_field: &PartitionField) -> bool {
+    field.field_id == another_field.field_id
+        && field.source_id == another_field.source_id
+        && compatible_transforms(field.transform, another_field.transform)
+}
+
+fn compatible_transforms(t1: Transform, t2: Transform) -> bool {
+    t1 == t2 || t1 == Transform::Void || t2 == Transform::Void
+}
+
+// Collects IDs of all partition fields used across specs
+fn all_field_ids(vec: &[PartitionSpecRef]) -> HashSet<i32> {
+    vec.iter()
+        .flat_map(|partition_spec| partition_spec.fields())
+        .map(|partition_field| partition_field.field_id)
+        .collect()
+}
+
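The function above exists to serve metadata tables: a scan over manifest entries must surface one `partition` struct that can hold tuples written under any historical spec. A sketch of the expected call site, with illustrative names; `type_to_arrow_type` is the crate-internal conversion also used in metrics.rs.

    // Sketch only: deriving the Arrow type of a unified `partition` column.
    let unified: StructType = partition_type(table.metadata())?;
    let partition_arrow_type = type_to_arrow_type(&Type::Struct(unified))?;

The tests below exercise the merge rules directly.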
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::spec::{PrimitiveType, Type};
+    use crate::spec::{FormatVersion, PrimitiveType, SortOrder, TableMetadataBuilder, Type};
 
     #[test]
     fn test_partition_spec() {
@@ -1733,4 +1856,172 @@ mod tests {
         assert_eq!(1002, spec.fields[1].field_id);
         assert!(!spec.has_sequential_ids());
     }
+
+    #[test]
+    fn test_combine_partition_type() -> Result<()> {
+        let schema = Schema::builder()
+            .with_fields(vec![
+                NestedField::required(1, "id", Type::Primitive(PrimitiveType::Int)).into(),
+                NestedField::required(2, "name", Type::Primitive(PrimitiveType::String)).into(),
+                NestedField::required(3, "ts", Type::Primitive(PrimitiveType::Timestamp)).into(),
+            ])
+            .build()?;
+
+        let metadata = TableMetadataBuilder::new(
+            schema,
+            PartitionSpec::unpartition_spec(),
+            SortOrder::unsorted_order(),
+            "my_location".to_string(),
+            FormatVersion::V2,
+            HashMap::new(),
+        )?
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(1)
+                .add_partition_fields(vec![
+                    UnboundPartitionField {
+                        source_id: 1,
+                        field_id: Some(1001),
+                        name: "id_bucket".to_string(),
+                        transform: Transform::Bucket(16),
+                    },
+                    UnboundPartitionField {
+                        source_id: 1,
+                        field_id: Some(1002),
+                        name: "id_truncate".to_string(),
+                        transform: Transform::Truncate(4),
+                    },
+                ])?
+                .build(),
+        )?
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(2)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 3,
+                    field_id: Some(1000),
+                    name: "ts_day".to_string(),
+                    transform: Transform::Day,
+                }])?
+                .build(),
+        )?
+        // Spec id 3 overrides a partition field name with the same id.
+        // We'll later assert that the new name is used instead of the old one.
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(3)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 3,
+                    field_id: Some(1000),
+                    name: "ts_day_overridden".to_string(),
+                    transform: Transform::Day,
+                }])?
+                .build(),
+        )?
+        // Add a void transform
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(4)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 2,
+                    field_id: Some(9999),
+                    name: "name_partition".to_string(),
+                    transform: Transform::Void,
+                }])?
+                .build(),
+        )?
+        // Newer partition fields can override partition void fields
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(5)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 2,
+                    field_id: Some(9999),
+                    name: "name_partition".to_string(),
+                    transform: Transform::Identity,
+                }])?
+                .build(),
+        )?
+        .build()?
+        .metadata;
+
+        assert_eq!(
+            partition_type(&metadata)?,
+            // Assert that fields are sorted
+            StructType::new(vec![
+                NestedField::optional(
+                    1000,
+                    "ts_day_overridden",
+                    Type::Primitive(PrimitiveType::Date),
+                )
+                .into(),
+                NestedField::optional(1001, "id_bucket", Type::Primitive(PrimitiveType::Int))
+                    .into(),
+                NestedField::optional(1002, "id_truncate", Type::Primitive(PrimitiveType::Int))
+                    .into(),
+                NestedField::optional(
+                    9999,
+                    "name_partition",
+                    Type::Primitive(PrimitiveType::String),
+                )
+                .into(),
+            ])
+        );
+
+        Ok(())
+    }
+
+    #[test]
+    fn test_combine_partition_type_incompatible_specs() -> Result<()> {
+        let metadata = TableMetadataBuilder::new(
+            Schema::builder()
+                .with_fields(vec![NestedField::required(
+                    1,
+                    "id",
+                    Type::Primitive(PrimitiveType::Int),
+                )
+                .into()])
+                .build()?,
+            PartitionSpec::unpartition_spec(),
+            SortOrder::unsorted_order(),
+            "my_location".to_string(),
+            FormatVersion::V2,
+            HashMap::new(),
+        )?
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(1)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 1,
+                    field_id: Some(2),
+                    name: "id_bucket".to_string(),
+                    transform: Transform::Bucket(4),
+                }])?
+                .build(),
+        )?
+        // Change the partition field incompatibly
+        .add_partition_spec(
+            UnboundPartitionSpec::builder()
+                .with_spec_id(2)
+                .add_partition_fields(vec![UnboundPartitionField {
+                    source_id: 1,
+                    field_id: Some(2),
+                    name: "id_bucket".to_string(),
+                    // Change bucket[4] to bucket[8]
+                    transform: Transform::Bucket(8),
+                }])?
+                .build(),
+        )?
+        .build()?
+        .metadata;
+
+        let result = partition_type(&metadata);
+
+        assert!(result
+            .unwrap_err()
+            .to_string()
+            .contains("Conflicting partition fields"));
+
+        Ok(())
+    }
 }

From c6f0c0671490be2685a56be4b61c5c0053061660 Mon Sep 17 00:00:00 2001
From: Willi Raschkowski
Date: Thu, 13 Mar 2025 02:02:47 +0000
Subject: [PATCH 3/3] Update comments

---
 crates/iceberg/src/inspect/metrics.rs | 2 +-
 crates/iceberg/src/scan.rs            | 7 +++----
 2 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/crates/iceberg/src/inspect/metrics.rs b/crates/iceberg/src/inspect/metrics.rs
index ee0d37378..d7d6d4d76 100644
--- a/crates/iceberg/src/inspect/metrics.rs
+++ b/crates/iceberg/src/inspect/metrics.rs
@@ -416,7 +416,7 @@ impl ReadableColumnMetricsStructBuilder {
     }
 }
 
-/// Helper to serve increment field ids.
+/// Helper to serve incrementing field ids.
 struct IncrementingFieldId(i32);
 
 impl IncrementingFieldId {
diff --git a/crates/iceberg/src/scan.rs b/crates/iceberg/src/scan.rs
index cfcf45af9..b2b01eba5 100644
--- a/crates/iceberg/src/scan.rs
+++ b/crates/iceberg/src/scan.rs
@@ -1287,10 +1287,9 @@ pub mod tests {
             .record_count(1)
             .partition(Struct::from_iter([Some(Literal::long(100))]))
             .key_metadata(None)
-            // Note:
-            // The bounds below need to agree with the test data written below
-            // into the Parquet file. If not, tests that rely on filter scans
-            // fail because of wrong bounds.
+            // Note: The bounds below need to agree with the test data written
+            // into the Parquet file below. If not, tests that rely on filter
+            // scans will fail because of wrong bounds.
             .lower_bounds(HashMap::from([
                 (1, Datum::long(1)),
                 (2, Datum::long(2)),