diff --git a/Cargo.toml b/Cargo.toml index b4a3d486..5ad039e5 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -27,7 +27,6 @@ members = [ "mutable_batch", "object_store_mem_cache", "object_store_metrics", - "observability_deps", "panic_logging", "parquet_file", "predicate", diff --git a/arrow_util/Cargo.toml b/arrow_util/Cargo.toml index 8458a19c..aea9d1ff 100644 --- a/arrow_util/Cargo.toml +++ b/arrow_util/Cargo.toml @@ -22,7 +22,7 @@ comfy-table = { version = "7.1", default-features = false } hashbrown = { workspace = true } num-traits = "0.2" parquet = { workspace = true } -regex = "1.11.1" +regex = "1.11.2" snafu = "0.8" uuid = "1" workspace-hack = { version = "0.1", path = "../workspace-hack" } diff --git a/authz/Cargo.toml b/authz/Cargo.toml index 7d377ebe..cc8333fd 100644 --- a/authz/Cargo.toml +++ b/authz/Cargo.toml @@ -28,7 +28,7 @@ assert_matches = "1.5.0" parking_lot = "0.12.4" paste = "1.0.15" test_helpers_authz = { path = "../test_helpers_authz" } -tokio = "1.47.0" +tokio = "1.47.1" [features] http = ["dep:http"] diff --git a/backoff/src/lib.rs b/backoff/src/lib.rs index 41e2aaf3..09321795 100644 --- a/backoff/src/lib.rs +++ b/backoff/src/lib.rs @@ -126,21 +126,6 @@ impl Backoff { } } - /// Fade this backoff over to a different backoff config. 
- pub fn fade_to(&mut self, config: &BackoffConfig) { - // Note: `new` won't have the same RNG, but this doesn't matter - let new = Self::new(config); - - *self = Self { - init_backoff: new.init_backoff, - next_backoff_secs: self.next_backoff_secs, - max_backoff_secs: new.max_backoff_secs, - base: new.base, - deadline: new.deadline, - rng: self.rng.take(), - }; - } - /// Perform an async operation that retries with a backoff pub async fn retry_with_backoff( &mut self, diff --git a/catalog_cache/benches/list_encode.rs b/catalog_cache/benches/list_encode.rs index 7740e5fc..17a4d009 100644 --- a/catalog_cache/benches/list_encode.rs +++ b/catalog_cache/benches/list_encode.rs @@ -131,6 +131,7 @@ fn encode_partition_snapshot(i: usize) -> Bytes { Default::default(), Default::default(), Default::default(), + None, // max_time ); // Create associated Parquet files: let parquet_files = vec![ diff --git a/client_util/Cargo.toml b/client_util/Cargo.toml index 8d5dc7a9..ff2c1341 100644 --- a/client_util/Cargo.toml +++ b/client_util/Cargo.toml @@ -15,9 +15,9 @@ iox_http_util = { path = "../iox_http_util" } reqwest = { workspace = true, features = ["stream", "rustls-tls-native-roots"] } # This direct dependency on rustls can probably be removed when tonic is upgraded to 0.13+. # See for more details. 
-rustls = { version = "0.23", default-features = false, features = ["ring", "std", "logging", "tls12"] } -thiserror = "2.0.12" -tonic = { version = "0.12", features = ["tls", "tls-native-roots"] } +rustls = { version = "0.23", default-features = false } +thiserror = "2.0.16" +tonic = { version = "0.12", features = ["gzip", "tls", "tls-native-roots", "zstd"] } tower = { workspace = true } workspace-hack = { version = "0.1", path = "../workspace-hack" } diff --git a/data_types/Cargo.toml b/data_types/Cargo.toml index e2c9af59..bdfe3750 100644 --- a/data_types/Cargo.toml +++ b/data_types/Cargo.toml @@ -21,7 +21,7 @@ generated_types = { path = "../generated_types" } murmur3 = "0.5.2" tracing = { workspace = true } ordered-float = "5" -percent-encoding = "2.3.1" +percent-encoding = "2.3.2" prost = { workspace = true } schema = { path = "../schema" } serde_json = "1.0" @@ -33,7 +33,7 @@ sqlx = { workspace = true, features = [ "postgres", "uuid", ] } -thiserror = "2.0.12" +thiserror = "2.0.16" uuid = { version = "1", features = ["v4"] } workspace-hack = { version = "0.1", path = "../workspace-hack" } diff --git a/data_types/src/lib.rs b/data_types/src/lib.rs index 7509ac96..e6473dcf 100644 --- a/data_types/src/lib.rs +++ b/data_types/src/lib.rs @@ -25,9 +25,9 @@ pub use service_limits::*; use generated_types::google::protobuf as google; use generated_types::influxdata::iox::{ - Target, catalog::v1 as catalog_proto, catalog_storage::v1 as catalog_storage_proto, - schema::v1 as schema_proto, skipped_compaction::v1 as skipped_compaction_proto, - table::v1 as table_proto, + Target, catalog::v1 as catalog_proto, catalog::v2 as catalog_v2_proto, + catalog_storage::v1 as catalog_storage_proto, schema::v1 as schema_proto, + skipped_compaction::v1 as skipped_compaction_proto, table::v1 as table_proto, }; use schema::TIME_COLUMN_NAME; use snafu::Snafu; @@ -383,6 +383,13 @@ impl NamespaceVersion { } } +impl Add for NamespaceVersion { + type Output = Self; + fn add(self, rhs: i64) -> 
Self { + Self(self.0 + rhs) + } +} + /// Data object for a namespace #[derive(Debug, Clone, PartialEq, sqlx::FromRow)] pub struct Namespace { @@ -747,6 +754,8 @@ pub struct TableWithStorage { pub deleted_at: Option, /// The total number of active columns in this table. pub column_count: i64, + /// Whether this table is enabled for an iceberg export. + pub iceberg_enabled: bool, } /// Serialise a [`TableWithStorage`] object into its protobuf representation. @@ -760,6 +769,7 @@ impl From for catalog_storage_proto::TableWithStorage { size_bytes: value.size_bytes, deleted_at: value.deleted_at.map(google::Timestamp::from), column_count: value.column_count, + iceberg_enabled: value.iceberg_enabled, } } } @@ -784,6 +794,7 @@ impl TryFrom for TableWithStorage { size_bytes: value.size_bytes, deleted_at: value.deleted_at.map(Timestamp::from), column_count: value.column_count, + iceberg_enabled: value.iceberg_enabled, }) } } @@ -961,6 +972,52 @@ impl From for SkippedCompaction { } } +/// Pre-computed retention info for efficient retention queries on a partition. +/// Stores the computed retention boundaries for both parquet files and partitions +/// to eliminate O(namespaces × partitions) retention query complexity. +#[derive(Debug, Clone, Copy, PartialEq, Eq, sqlx::FromRow)] +pub struct PartitionRetention { + /// The partition this retention info applies to + pub partition_id: PartitionId, + /// The namespace this partition belongs to + pub namespace_id: NamespaceId, + /// Cached namespace retention period to avoid joins. + /// NULL when we don't want to slow down partition creation. + pub retention_period_ns: Option, + /// When files in this partition start becoming eligible for deletion. + /// NULL indicates this needs to be computed. + pub retention_start_time_ns: Option, + /// When files in this partition finish becoming eligible for deletion. + /// Currently always NULL for parquet file retention. 
+ pub retention_end_time_ns: Option, +} + +impl From for catalog_v2_proto::PartitionRetention { + fn from(retention: PartitionRetention) -> Self { + Self { + partition_id: retention.partition_id.get(), + namespace_id: retention.namespace_id.get(), + retention_period_ns: retention.retention_period_ns, + retention_start_time_ns: retention.retention_start_time_ns, + retention_end_time_ns: retention.retention_end_time_ns, + } + } +} + +impl TryFrom for PartitionRetention { + type Error = &'static str; + + fn try_from(retention: catalog_v2_proto::PartitionRetention) -> Result { + Ok(Self { + partition_id: PartitionId::new(retention.partition_id), + namespace_id: NamespaceId::new(retention.namespace_id), + retention_period_ns: retention.retention_period_ns, + retention_start_time_ns: retention.retention_start_time_ns, + retention_end_time_ns: retention.retention_end_time_ns, + }) + } +} + /// Whether the file was created via bulk ingest or not (For now. This may be expanded to /// distinguish between ingester and compactor in the future). /// @@ -3440,6 +3497,7 @@ mod tests { size_bytes: 1, deleted_at: None, column_count: 1, + iceberg_enabled: false, }; let catalog_proto_table = catalog_storage_proto::TableWithStorage::from(table_active.clone()); @@ -3455,6 +3513,7 @@ mod tests { size_bytes: 2, deleted_at: Some(Timestamp::new(1_000_000_001)), column_count: 2, + iceberg_enabled: false, }; let catalog_proto_table = catalog_storage_proto::TableWithStorage::from(table_deleted.clone()); diff --git a/data_types/src/partition.rs b/data_types/src/partition.rs index 0e040d5a..5966a756 100644 --- a/data_types/src/partition.rs +++ b/data_types/src/partition.rs @@ -610,6 +610,10 @@ pub struct Partition { /// The time at which this partition was created, or `None` if this partition was created before /// this field existed. created_at: Option, + + /// The maximum time of data that can exist in this partition based on the partition template. 
+ /// This is calculated when the partition is created and used for efficient retention queries. + pub max_time: Option, } impl Partition { @@ -627,6 +631,7 @@ impl Partition { new_file_at: Option, cold_compact_at: Option, created_at: Option, + max_time: Option, ) -> Self { Self { id, @@ -637,6 +642,7 @@ impl Partition { new_file_at, cold_compact_at, created_at, + max_time, } } diff --git a/data_types/src/partition_template.rs b/data_types/src/partition_template.rs index a4eb3ccd..45761892 100644 --- a/data_types/src/partition_template.rs +++ b/data_types/src/partition_template.rs @@ -180,7 +180,7 @@ use std::{ cmp::min, collections::{HashMap, HashSet}, fmt::{Display, Formatter, Write}, - ops::{Add, Range}, + ops::Range, sync::{Arc, LazyLock}, }; @@ -1470,7 +1470,7 @@ impl PartitionDuration { } } -impl Add for chrono::DateTime { +impl std::ops::Add for chrono::DateTime { type Output = Self; /// Add a [`PartitionDuration`] to a [`chrono::DateTime`]. fn add(self, rhs: PartitionDuration) -> Self::Output { diff --git a/data_types/src/snapshot/list.rs b/data_types/src/snapshot/list.rs index c494a26a..c2e59114 100644 --- a/data_types/src/snapshot/list.rs +++ b/data_types/src/snapshot/list.rs @@ -3,8 +3,11 @@ use bytes::Bytes; use prost::Message; use snafu::{Snafu, ensure}; -use std::marker::PhantomData; -use std::ops::Range; +use std::{ + cmp::Ordering, + marker::PhantomData, + ops::{Deref, Range}, +}; use generated_types::influxdata::iox::catalog_cache::v1 as generated; @@ -29,6 +32,51 @@ pub enum Error { }, } +/// How to get the `i64` identifier to enable `MessageList::get_by_id` +pub trait GetId { + /// The ID value for this instance that may be used for lookup by `MessageList::get_by_id` + fn id(&self) -> i64; +} + +/// Ensures a list is sorted by ID, which is necessary for the binary search by ID +#[derive(Clone, Eq, PartialEq, Debug)] +pub struct SortedById { + values: Vec, +} + +impl SortedById { + /// Create a new instance sorted by the ID of the items, which 
`MessageList` relies on for + /// its implementation of `get_by_id`. + pub fn new(mut values: Vec) -> Self { + values.sort_unstable_by_key(|v| v.id()); + + SortedById { values } + } +} + +impl FromIterator for SortedById { + fn from_iter>(iter: I) -> Self { + Self::new(Vec::from_iter(iter)) + } +} + +impl Deref for SortedById { + type Target = [T]; + + fn deref(&self) -> &Self::Target { + self.values.deref() + } +} + +impl IntoIterator for SortedById { + type Item = T; + type IntoIter = std::vec::IntoIter; + + fn into_iter(self) -> Self::IntoIter { + self.values.into_iter() + } +} + /// Error type for [`MessageList`] pub type Result = std::result::Result; @@ -42,22 +90,22 @@ pub type Result = std::result::Result; /// by arrow, that provides this and is designed to be combined with [`prost`]'s support /// for zero-copy decoding of [`Bytes`] #[derive(Clone, Eq, PartialEq)] -pub struct MessageList { +pub struct MessageList { len: usize, offsets: Bytes, values: Bytes, phantom: PhantomData, } -impl MessageList { +impl MessageList { /// Encode `values` to a [`MessageList`] - pub fn encode(values: &[T]) -> Result { + pub fn encode(values: SortedById) -> Result { let cap = (values.len() + 1) * 4; let mut offsets: Vec = Vec::with_capacity(cap); offsets.extend_from_slice(&0_u32.to_le_bytes()); let mut cap = 0; - for x in values { + for x in values.iter() { cap += x.encoded_len(); let offset = u32::try_from(cap).unwrap(); offsets.extend_from_slice(&offset.to_le_bytes()); @@ -99,9 +147,56 @@ impl MessageList { let data = self.values.slice(start..end); Ok(T::decode(data)?) } + + /// Returns the element with ID `id` found via binary search. Implemented by hand rather than + /// calling `std::slice::binary_search_by` to avoid needing to allocate a vector to create a + /// slice to call `binary_search_by` on. This code was largely copied from the stdlib's + /// implementation of `binary_search_by` as of Rust 1.89.0. 
+ pub fn get_by_id(&self, id: i64) -> Result> { + let mut size = self.len(); + if size == 0 { + return Ok(None); + } + let mut base = 0usize; + + // This loop intentionally doesn't have an early exit if the comparison + // returns Equal. We want the number of loop iterations to depend *only* + // on the size of the input slice so that the CPU can reliably predict + // the loop count. + while size > 1 { + let half = size / 2; + let mid = base + half; + + let current_item = self.get(mid)?; + let cmp = current_item.id().cmp(&id); + + // Binary search interacts poorly with branch prediction, so force + // the compiler to use conditional moves if supported by the target + // architecture. + base = std::hint::select_unpredictable(cmp == Ordering::Greater, base, mid); + + // This is imprecise in the case where `size` is odd and the + // comparison returns Greater: the mid element still gets included + // by `size` even though it's known to be larger than the element + // being searched for. + // + // This is fine though: we gain more performance by keeping the + // loop iteration count invariant (and thus predictable) than we + // lose from considering one additional element. 
+ size -= half; + } + + let base_item = self.get(base)?; + let cmp = base_item.id().cmp(&id); + if cmp == Ordering::Equal { + Ok(Some(base_item)) + } else { + Ok(None) + } + } } -impl std::fmt::Debug for MessageList { +impl std::fmt::Debug for MessageList { fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { let mut l = f.debug_list(); for idx in 0..self.len() { @@ -111,7 +206,7 @@ impl std::fmt::Debug for MessageList { } } -impl From for MessageList { +impl From for MessageList { fn from(proto: generated::MessageList) -> Self { let len = (proto.offsets.len() / 4).saturating_sub(1); Self { @@ -123,7 +218,7 @@ impl From for MessageList { } } -impl From> for generated::MessageList { +impl From> for generated::MessageList { fn from(value: MessageList) -> Self { Self { offsets: value.offsets, @@ -132,7 +227,7 @@ impl From> for generated::MessageList { } } -impl IntoIterator for MessageList { +impl IntoIterator for MessageList { type Item = Result; type IntoIter = MessageListIter; @@ -146,12 +241,12 @@ impl IntoIterator for MessageList { /// [`Iterator`] for [`MessageList`] #[derive(Debug)] -pub struct MessageListIter { +pub struct MessageListIter { iter: Range, list: MessageList, } -impl Iterator for MessageListIter { +impl Iterator for MessageListIter { type Item = Result; fn next(&mut self) -> Option { @@ -167,18 +262,49 @@ impl Iterator for MessageListIter { mod tests { use super::*; + /// As a simple hack for ease of test setup, the ID of a string is its length. 
+ impl GetId for String { + fn id(&self) -> i64 { + self.len() as i64 + } + } + + impl GetId for i32 { + fn id(&self) -> i64 { + *self as i64 + } + } + #[test] fn test_simple() { - let strings = ["", "test", "foo", "abc", "", "skd"]; - let strings: Vec<_> = strings.into_iter().map(ToString::to_string).collect(); + // Note this list is not sorted by ID (`len`) + let strings = ["", "test", "foo", "abcde", "z", "skedaddle"]; + let strings: SortedById<_> = strings.into_iter().map(ToString::to_string).collect(); - let encoded = MessageList::encode(&strings).unwrap(); + let encoded = MessageList::encode(strings.clone()).unwrap(); - assert_eq!(encoded.get(5).unwrap().as_str(), "skd"); - assert_eq!(encoded.get(2).unwrap().as_str(), "foo"); assert_eq!(encoded.get(0).unwrap().as_str(), ""); + assert_eq!(encoded.get_by_id(0).unwrap().unwrap().as_str(), ""); + + assert_eq!(encoded.get(1).unwrap().as_str(), "z"); + assert_eq!(encoded.get_by_id(1).unwrap().unwrap().as_str(), "z"); + + // there is no value with ID 2 + assert!(encoded.get_by_id(2).unwrap().is_none()); + + assert_eq!(encoded.get(2).unwrap().as_str(), "foo"); + assert_eq!(encoded.get_by_id(3).unwrap().unwrap().as_str(), "foo"); + + assert_eq!(encoded.get(3).unwrap().as_str(), "test"); + assert_eq!(encoded.get_by_id(4).unwrap().unwrap().as_str(), "test"); + + assert_eq!(encoded.get(4).unwrap().as_str(), "abcde"); + assert_eq!(encoded.get_by_id(5).unwrap().unwrap().as_str(), "abcde"); + + assert_eq!(encoded.get(5).unwrap().as_str(), "skedaddle"); + assert_eq!(encoded.get_by_id(9).unwrap().unwrap().as_str(), "skedaddle"); - let decoded: Vec<_> = encoded.clone().into_iter().map(Result::unwrap).collect(); + let decoded: SortedById<_> = encoded.clone().into_iter().map(Result::unwrap).collect(); assert_eq!(strings, decoded); let proto = generated::MessageList::from(encoded.clone()); @@ -189,8 +315,8 @@ mod tests { let invalid = MessageList::::from(proto); invalid.get(2).unwrap_err(); - let strings: Vec = vec![]; - let 
encoded = MessageList::encode(&strings).unwrap(); + let strings: SortedById = SortedById::new(vec![]); + let encoded = MessageList::encode(strings).unwrap(); assert_eq!(encoded.len(), 0); assert!(encoded.is_empty()); diff --git a/data_types/src/snapshot/namespace.rs b/data_types/src/snapshot/namespace.rs index 50f36b7c..1496dbcf 100644 --- a/data_types/src/snapshot/namespace.rs +++ b/data_types/src/snapshot/namespace.rs @@ -12,7 +12,7 @@ use crate::{ use super::{ hash::{HashBuckets, HashBucketsEncoder}, - list::MessageList, + list::{GetId, MessageList, SortedById}, }; /// Error for [`NamespaceSnapshot`] @@ -57,6 +57,12 @@ pub enum Error { /// Result for [`NamespaceSnapshot`] pub type Result = std::result::Result; +impl GetId for proto::NamespaceTable { + fn id(&self) -> i64 { + self.id + } +} + /// A snapshot of a namespace #[derive(Debug, Clone)] pub struct NamespaceSnapshot { @@ -80,7 +86,7 @@ impl NamespaceSnapshot { tables: impl IntoIterator, generation: u64, ) -> Result { - let mut tables: Vec<_> = tables + let tables: SortedById<_> = tables .into_iter() .map(|t| proto::NamespaceTable { id: t.id.get(), @@ -88,8 +94,6 @@ impl NamespaceSnapshot { deleted_at: t.deleted_at.map(|ts| ts.get()), }) .collect(); - // TODO(marco): wire up binary search to find table by ID - tables.sort_unstable_by_key(|t| t.id); let mut table_names = HashBucketsEncoder::new(tables.len()); for (index, table) in tables.iter().enumerate() { @@ -108,7 +112,7 @@ impl NamespaceSnapshot { deleted_at: namespace.deleted_at, partition_template: namespace.partition_template.as_proto().cloned(), router_version: namespace.router_version, - tables: MessageList::encode(&tables).context(TableEncodeSnafu)?, + tables: MessageList::encode(tables).context(TableEncodeSnafu)?, table_names: table_names.finish(), generation, }) @@ -170,10 +174,30 @@ impl NamespaceSnapshot { }) } + /// Look up a [`NamespaceSnapshotTable`] by `TableId` using binary search of the list of + /// tables. 
_Does_ include soft-deleted entries. + /// + /// Hard-deleted tables may still appear in the table cache, but should NOT appear in + /// the namespace snapshot's tables, so this method must be used to check actual presence or + /// absence before looking up additional table information in the table cache. + /// + /// # Performance + /// + /// This method decodes each record the binary search needs to check, so may not be appropriate + /// for performance-sensitive use cases. + pub fn lookup_table_by_id(&self, id: TableId) -> Result> { + // This requires that the tables are sorted by ID, which `encode` does. + Ok(self + .tables + .get_by_id(id.get()) + .context(TableDecodeSnafu)? + .map(|t| t.into())) + } + /// Lookup a [`NamespaceSnapshotTable`] by name. Does not include deleted entries. pub fn lookup_table_by_name(&self, name: &str) -> Result> { for idx in self.table_names.lookup(name.as_bytes()) { - let table = self.tables.get(idx).context(TableEncodeSnafu)?; + let table = self.tables.get(idx).context(TableDecodeSnafu)?; if table.name == name.as_bytes() { return Ok(Some(table.into())); } @@ -198,7 +222,7 @@ impl NamespaceSnapshot { .map(|x| Duration::from_nanos(x as _)) } - /// When this file was deleted if any + /// When this namespace was deleted if any pub fn deleted_at(&self) -> Option { self.deleted_at } diff --git a/data_types/src/snapshot/partition.rs b/data_types/src/snapshot/partition.rs index 4644427c..23e30de5 100644 --- a/data_types/src/snapshot/partition.rs +++ b/data_types/src/snapshot/partition.rs @@ -1,11 +1,13 @@ //! 
Snapshot definition for partitions -use crate::snapshot::list::MessageList; -use crate::snapshot::mask::{BitMask, BitMaskBuilder}; use crate::{ ColumnId, ColumnSet, CompactionLevelProtoError, NamespaceId, ObjectStoreId, ParquetFile, ParquetFileId, ParquetFileSource, Partition, PartitionHashId, PartitionHashIdError, PartitionId, PartitionKey, SkippedCompaction, SortKeyIds, TableId, Timestamp, + snapshot::{ + list::{GetId, MessageList, SortedById}, + mask::{BitMask, BitMaskBuilder}, + }, }; use bytes::Bytes; use generated_types::influxdata::iox::{ @@ -43,6 +45,12 @@ pub enum Error { /// Result for [`PartitionSnapshot`] pub type Result = std::result::Result; +impl GetId for proto::PartitionFile { + fn id(&self) -> i64 { + self.id + } +} + /// A snapshot of a partition /// /// # Soft Deletion @@ -94,7 +102,7 @@ impl PartitionSnapshot { acc }); - let files = files + let files: SortedById<_> = files .into_iter() .map(|file| { let mut mask = BitMaskBuilder::new(columns.len()); @@ -117,7 +125,7 @@ impl PartitionSnapshot { use_numeric_partition_id: Some(file.partition_hash_id.is_none()), } }) - .collect::>(); + .collect(); Ok(Self { generation, @@ -126,7 +134,7 @@ impl PartitionSnapshot { partition_id: partition.id, partition_hash_id: partition.hash_id().cloned(), key: partition.partition_key.as_bytes().to_vec().into(), - files: MessageList::encode(&files).context(FileEncodeSnafu)?, + files: MessageList::encode(files).context(FileEncodeSnafu)?, sort_key: partition.sort_key_ids().cloned().unwrap_or_default(), table_id: partition.table_id, new_file_at: partition.new_file_at, @@ -248,6 +256,7 @@ impl PartitionSnapshot { self.new_file_at, self.cold_compact_at, self.created_at, + None, // max_time - not stored in snapshot (can be computed from partition key) )) } @@ -333,6 +342,7 @@ mod tests { Default::default(), Default::default(), Default::default(), + None, // max_time ); // Create associated Parquet files: let parquet_files = vec![ @@ -409,13 +419,13 @@ mod tests { 
use_numeric_partition_id: Some(true), ..parquet_file_missing_new_numeric_id_field_proto.clone() }; - - let files = MessageList::encode(&[ + let parquet_files = SortedById::new(vec![ parquet_file_missing_new_numeric_id_field_proto, parquet_file_new_numeric_id_field_false_proto, parquet_file_new_numeric_id_field_true_proto, - ]) - .unwrap(); + ]); + + let files = MessageList::encode(parquet_files).unwrap(); let files_proto: proto::MessageList = files.into(); // Create cached proto for two different Partitions: diff --git a/data_types/src/snapshot/root.rs b/data_types/src/snapshot/root.rs index e72d8835..fa75874a 100644 --- a/data_types/src/snapshot/root.rs +++ b/data_types/src/snapshot/root.rs @@ -7,7 +7,7 @@ use crate::{Namespace, NamespaceId, Timestamp}; use super::{ hash::{HashBuckets, HashBucketsEncoder}, - list::MessageList, + list::{GetId, MessageList, SortedById}, }; /// Error for [`RootSnapshot`] @@ -33,6 +33,12 @@ pub enum Error { /// Result for [`RootSnapshot`] pub type Result = std::result::Result; +impl GetId for proto::RootNamespace { + fn id(&self) -> i64 { + self.id + } +} + /// A snapshot of root. /// /// # Soft Deletion @@ -52,7 +58,7 @@ impl RootSnapshot { namespaces: impl IntoIterator, generation: u64, ) -> Result { - let mut namespaces: Vec<_> = namespaces + let namespaces: SortedById<_> = namespaces .into_iter() .map(|ns| proto::RootNamespace { id: ns.id.get(), @@ -61,9 +67,6 @@ impl RootSnapshot { }) .collect(); - // This sort is required for the binary search in `lookup_namespace_by_id` to function. 
- namespaces.sort_unstable_by_key(|ns| ns.id); - let mut namespace_names = HashBucketsEncoder::new(namespaces.len()); for (index, ns) in namespaces.iter().enumerate() { // exclude soft-deleted entries from name table @@ -73,7 +76,7 @@ impl RootSnapshot { } Ok(Self { - namespaces: MessageList::encode(&namespaces).context(NamespaceEncodeSnafu)?, + namespaces: MessageList::encode(namespaces).context(NamespaceEncodeSnafu)?, namespace_names: namespace_names.finish(), generation, }) @@ -113,31 +116,11 @@ impl RootSnapshot { /// for performance-sensitive use cases. pub fn lookup_namespace_by_id(&self, id: NamespaceId) -> Result> { // This requires that the namespaces are sorted by ID, which `encode` does. - - // Search through a slice of indices, as there isn't a way to get a slice of `&T` from - // `MessageList` without decoding everything - let indices_to_search: Vec<_> = (0..self.namespaces.len()).collect(); - - let element_idx = indices_to_search.binary_search_by_key(&id.get(), |&idx| { - let namespace_snapshot = self - .namespaces - .get(idx) - // The binary search APIs expect the comparator functions to be infallible. If - // decoding of cache records fails, we have bigger problems than only not being - // able to do a binary search, so go ahead and panic. - .expect("decoding root namespaces for binary search should succeed"); - namespace_snapshot.id - }); - - element_idx - .ok() - .map(|idx| { - self.namespaces - .get(idx) - .context(NamespaceDecodeSnafu) - .map(|t| t.into()) - }) - .transpose() + Ok(self + .namespaces + .get_by_id(id.get()) + .context(NamespaceDecodeSnafu)? + .map(|ns| ns.into())) } /// Lookup a [`RootSnapshotNamespace`] by name. Does not include deleted entries. diff --git a/data_types/src/snapshot/table.rs b/data_types/src/snapshot/table.rs index d69cb4fb..afce4ac2 100644 --- a/data_types/src/snapshot/table.rs +++ b/data_types/src/snapshot/table.rs @@ -1,8 +1,8 @@ //! 
Snapshot definition for tables -use crate::snapshot::list::MessageList; use crate::{ Column, ColumnId, ColumnTypeProtoError, NamespaceId, Partition, PartitionId, PartitionKey, Table, TableId, Timestamp, + snapshot::list::{GetId, MessageList, SortedById}, }; use bytes::Bytes; use generated_types::influxdata::iox::catalog_cache::v1 as proto; @@ -52,6 +52,18 @@ pub enum Error { /// Result for [`TableSnapshot`] pub type Result = std::result::Result; +impl GetId for proto::TablePartition { + fn id(&self) -> i64 { + self.id + } +} + +impl GetId for proto::TableColumn { + fn id(&self) -> i64 { + self.id + } +} + /// A snapshot of a table #[derive(Debug, Clone)] pub struct TableSnapshot { @@ -74,7 +86,7 @@ impl TableSnapshot { columns: Vec, generation: u64, ) -> Result { - let columns: Vec<_> = columns + let columns: SortedById<_> = columns .into_iter() .map(|c| proto::TableColumn { id: c.id.get(), @@ -83,7 +95,7 @@ impl TableSnapshot { }) .collect(); - let partitions: Vec<_> = partitions + let partitions: SortedById<_> = partitions .into_iter() .map(|p| proto::TablePartition { id: p.id.get(), @@ -95,8 +107,8 @@ impl TableSnapshot { table_id: table.id, namespace_id: table.namespace_id, table_name: table.name.into(), - partitions: MessageList::encode(&partitions).context(PartitionEncodeSnafu)?, - columns: MessageList::encode(&columns).context(ColumnEncodeSnafu)?, + partitions: MessageList::encode(partitions).context(PartitionEncodeSnafu)?, + columns: MessageList::encode(columns).context(ColumnEncodeSnafu)?, partition_template: table.partition_template.as_proto().cloned(), iceberg_enabled: table.iceberg_enabled, generation, @@ -193,6 +205,11 @@ impl TableSnapshot { pub fn table_id(&self) -> TableId { self.table_id } + + /// When this table was deleted if any + pub fn deleted_at(&self) -> Option { + self.deleted_at + } } /// Partition information stored within [`TableSnapshot`] diff --git a/flightsql/src/cmd.rs b/flightsql/src/cmd.rs index 2d8987e3..b98f85e9 100644 --- 
a/flightsql/src/cmd.rs +++ b/flightsql/src/cmd.rs @@ -1,6 +1,6 @@ //! IOx FlightSQL Command structures -use std::{collections::HashMap, fmt::Display}; +use std::{collections::HashMap, fmt::Display, slice}; use arrow::{ array::RecordBatch, @@ -143,7 +143,7 @@ impl Display for PreparedStatementHandle { write!( f, ",{}", - pretty_format_batches(&[batch.clone()]).map_err(|_| std::fmt::Error)? + pretty_format_batches(slice::from_ref(batch)).map_err(|_| std::fmt::Error)? )? }; write!(f, ")") diff --git a/generated_types/Cargo.toml b/generated_types/Cargo.toml index d4ae3445..1c96ac30 100644 --- a/generated_types/Cargo.toml +++ b/generated_types/Cargo.toml @@ -14,7 +14,7 @@ pbjson-types = { workspace = true } prost = { workspace = true } prost-types = { workspace = true } serde = { version = "1.0", features = ["derive"] } -tonic = { version = "0.12", features = ["tls", "tls-roots"] } +tonic = { version = "0.12", features = ["gzip", "tls", "tls-roots", "zstd"] } tracing = { workspace = true } uuid = { version = "1" } workspace-hack = { version = "0.1", path = "../workspace-hack" } diff --git a/generated_types/protos/influxdata/iox/catalog/v2/service.proto b/generated_types/protos/influxdata/iox/catalog/v2/service.proto index ddf45513..fdd3e31b 100644 --- a/generated_types/protos/influxdata/iox/catalog/v2/service.proto +++ b/generated_types/protos/influxdata/iox/catalog/v2/service.proto @@ -29,7 +29,12 @@ service CatalogService { rpc NamespaceDeleteOld(NamespaceDeleteOldRequest) returns (NamespaceDeleteOldResponse); rpc TableCreate(TableCreateRequest) returns (TableCreateResponse); - rpc TableGetById(TableGetByIdRequest) returns (TableGetByIdResponse); + rpc TableGetByIdAndNamespace(TableGetByIdAndNamespaceRequest) returns (TableGetByIdAndNamespaceResponse); + // Returns a table record regardless of its soft-deleted status. Essentially deprecated in favor + // of `TableGetByIdAndNamespace`. 
+ rpc TableGetById(TableGetByIdRequest) returns (TableGetByIdResponse) { + option deprecated = true; + }; rpc TableGetByNamespaceAndName(TableGetByNamespaceAndNameRequest) returns (TableGetByNamespaceAndNameResponse); rpc TableListByNamespaceId(TableListByNamespaceIdRequest) returns (stream TableListByNamespaceIdResponse); rpc TableList(TableListRequest) returns (stream TableListResponse); @@ -48,12 +53,14 @@ service CatalogService { rpc ColumnList(ColumnListRequest) returns (stream ColumnListResponse); rpc PartitionCreateOrGet(PartitionCreateOrGetRequest) returns (PartitionCreateOrGetResponse); + rpc PartitionCreateOrGetBatch(PartitionCreateOrGetBatchRequest) returns (stream PartitionCreateOrGetBatchResponse); rpc PartitionGetByIdBatch(PartitionGetByIdBatchRequest) returns (stream PartitionGetByIdBatchResponse); rpc PartitionListByTableId(PartitionListByTableIdRequest) returns (stream PartitionListByTableIdResponse); rpc PartitionListIds(PartitionListIdsRequest) returns (stream PartitionListIdsResponse); rpc PartitionCasSortKey(PartitionCasSortKeyRequest) returns (PartitionCasSortKeyResponse); rpc PartitionRecordSkippedCompaction(PartitionRecordSkippedCompactionRequest) returns (PartitionRecordSkippedCompactionResponse); rpc PartitionGetInSkippedCompactions(PartitionGetInSkippedCompactionsRequest) returns (stream PartitionGetInSkippedCompactionsResponse); + rpc PartitionGetInSkippedCompactionsV2(stream PartitionGetInSkippedCompactionsV2Request) returns (stream PartitionGetInSkippedCompactionsV2Response); rpc PartitionListSkippedCompactions(PartitionListSkippedCompactionsRequest) returns (stream PartitionListSkippedCompactionsResponse); rpc PartitionDeleteSkippedCompactions(PartitionDeleteSkippedCompactionsRequest) returns (PartitionDeleteSkippedCompactionsResponse); rpc PartitionMostRecentN(PartitionMostRecentNRequest) returns (stream PartitionMostRecentNResponse); @@ -65,6 +72,15 @@ service CatalogService { rpc PartitionSnapshot(PartitionSnapshotRequest) returns 
(PartitionSnapshotResponse); rpc PartitionMigrate(PartitionMigrateRequest) returns (PartitionMigrateResponse); + // Partition retention methods + rpc PartitionRetentionUpsert(PartitionRetentionUpsertRequest) returns (PartitionRetentionUpsertResponse); + rpc PartitionRetentionGetByPartitionId(PartitionRetentionGetByPartitionIdRequest) returns (PartitionRetentionGetByPartitionIdResponse); + rpc PartitionRetentionListPartitionsNeedingComputation(PartitionRetentionListPartitionsNeedingComputationRequest) returns (stream PartitionRetentionListPartitionsNeedingComputationResponse); + rpc PartitionRetentionReconcileMissingPartitions(PartitionRetentionReconcileMissingPartitionsRequest) returns (PartitionRetentionReconcileMissingPartitionsResponse); + rpc PartitionRetentionListPartitionsForParquetRetention(PartitionRetentionListPartitionsForParquetRetentionRequest) returns (stream PartitionRetentionListPartitionsForParquetRetentionResponse); + rpc PartitionRetentionListPartitionsForPartitionRetention(PartitionRetentionListPartitionsForPartitionRetentionRequest) returns (stream PartitionRetentionListPartitionsForPartitionRetentionResponse); + rpc PartitionRetentionInvalidateByNamespaceId(PartitionRetentionInvalidateByNamespaceIdRequest) returns (PartitionRetentionInvalidateByNamespaceIdResponse); + rpc ParquetFileFlagForDeleteByRetention(ParquetFileFlagForDeleteByRetentionRequest) returns (stream ParquetFileFlagForDeleteByRetentionResponse); rpc ParquetFileDeleteOldIdsOnly(ParquetFileDeleteOldIdsOnlyRequest) returns (stream ParquetFileDeleteOldIdsOnlyResponse); rpc ParquetFileDeleteOldIdsCount(ParquetFileDeleteOldIdsCountRequest) returns (ParquetFileDeleteOldIdsCountResponse); @@ -265,6 +281,16 @@ message TableCreateResponse { Table table = 1; } +message TableGetByIdAndNamespaceRequest { + int64 table_id = 1; + int64 namespace_id = 2; + SoftDeletedRows deleted = 3; +} + +message TableGetByIdAndNamespaceResponse { + Table table = 1; +} + message TableGetByIdRequest { int64 id 
= 1; } @@ -334,6 +360,7 @@ message TableSoftDeleteRequest { message TableSoftDeleteResponse { Table table = 1; + int64 router_version = 2; } message TableRenameRequest { @@ -343,6 +370,7 @@ message TableRenameRequest { message TableRenameResponse { Table table = 1; + int64 router_version = 2; } message TableUndeleteRequest { @@ -351,6 +379,7 @@ message TableUndeleteRequest { message TableUndeleteResponse { Table table = 1; + int64 router_version = 2; } message ColumnCreateOrGetRequest { @@ -405,6 +434,15 @@ message PartitionCreateOrGetResponse { Partition partition = 1; } +message PartitionCreateOrGetBatchRequest { + repeated string keys = 1; + int64 table_id = 2; +} + +message PartitionCreateOrGetBatchResponse { + Partition partition = 1; +} + message PartitionGetByIdBatchRequest { repeated int64 partition_ids = 1; } @@ -464,10 +502,18 @@ message PartitionGetInSkippedCompactionsRequest { repeated int64 partition_ids = 1; } +message PartitionGetInSkippedCompactionsV2Request { + int64 partition_id = 1; +} + message PartitionGetInSkippedCompactionsResponse { SkippedCompaction skipped_compaction = 1; } +message PartitionGetInSkippedCompactionsV2Response { + SkippedCompaction skipped_compaction = 1; +} + message PartitionListSkippedCompactionsRequest {} message PartitionListSkippedCompactionsResponse { @@ -735,6 +781,7 @@ message Partition { optional int64 new_file_at = 6; optional int64 cold_compact_at = 7; optional int64 created_at = 8; + optional int64 max_time = 9; } message SkippedCompaction { @@ -810,3 +857,74 @@ message ParquetFile { int64 max_l0_created_at = 14; ParquetFileSource source = 17; } + +// Partition retention messages +message PartitionRetention { + int64 partition_id = 1; + int64 namespace_id = 2; + optional int64 retention_period_ns = 3; + optional int64 retention_start_time_ns = 4; + optional int64 retention_end_time_ns = 5; +} + +message PartitionRetentionUpsertRequest { + int64 partition_id = 1; + int64 namespace_id = 2; + optional int64 
retention_period_ns = 3; + optional int64 retention_start_time_ns = 4; + optional int64 retention_end_time_ns = 5; +} + +message PartitionRetentionUpsertResponse { + PartitionRetention partition_retention = 1; +} + +message PartitionRetentionGetByPartitionIdRequest { + int64 partition_id = 1; +} + +message PartitionRetentionGetByPartitionIdResponse { + optional PartitionRetention partition_retention = 1; +} + +message PartitionRetentionListPartitionsNeedingComputationRequest { + int32 limit = 1; +} + +message PartitionRetentionListPartitionsNeedingComputationResponse { + int64 partition_id = 1; +} + +message PartitionRetentionReconcileMissingPartitionsRequest { + // Empty - no parameters needed +} + +message PartitionRetentionReconcileMissingPartitionsResponse { + int32 reconciled_count = 1; +} + +message PartitionRetentionListPartitionsForParquetRetentionRequest { + int64 cutoff_time_ns = 1; + int32 limit = 2; +} + +message PartitionRetentionListPartitionsForParquetRetentionResponse { + int64 partition_id = 1; +} + +message PartitionRetentionListPartitionsForPartitionRetentionRequest { + int64 cutoff_time_ns = 1; + int32 limit = 2; +} + +message PartitionRetentionListPartitionsForPartitionRetentionResponse { + int64 partition_id = 1; +} + +message PartitionRetentionInvalidateByNamespaceIdRequest { + int64 namespace_id = 1; +} + +message PartitionRetentionInvalidateByNamespaceIdResponse { + int32 invalidated_count = 1; +} diff --git a/generated_types/protos/influxdata/iox/catalog_storage/v1/service.proto b/generated_types/protos/influxdata/iox/catalog_storage/v1/service.proto index 8cee3822..66ad9ff7 100644 --- a/generated_types/protos/influxdata/iox/catalog_storage/v1/service.proto +++ b/generated_types/protos/influxdata/iox/catalog_storage/v1/service.proto @@ -219,4 +219,6 @@ message TableWithStorage { // Total number of active columns in this table. 
int64 column_count = 7; + + bool iceberg_enabled = 8; } diff --git a/generated_types/protos/influxdata/iox/table/v1/service.proto b/generated_types/protos/influxdata/iox/table/v1/service.proto index 4bf358a2..842918ef 100644 --- a/generated_types/protos/influxdata/iox/table/v1/service.proto +++ b/generated_types/protos/influxdata/iox/table/v1/service.proto @@ -84,15 +84,54 @@ message Table { optional google.protobuf.Timestamp deleted_at = 6; } +enum TableStatusFilter { + TABLE_STATUS_FILTER_UNSPECIFIED = 0; + TABLE_STATUS_FILTER_ACTIVE = 1; + TABLE_STATUS_FILTER_DELETED = 2; +} + +message TableStatusFilterList { + repeated TableStatusFilter inner = 1; +} + message GetTablesRequest { oneof target { // Name of the namespace to list tables for. string namespace_name = 1 [deprecated = true]; // The unique ID of the namespace to list tables for. int64 namespace_id = 2; - } -} + }; + // How to filter deleted tables in the response of this request + // If there is nothing in this field, the returned tables aren't filtered at all; + // everything is returned. + // If there are items in this field, however, the only tables that are returned + // are those whose statuses are contained in this field. + // + // So, by default, no filtering is done. + // + // But if someone specified [Active, Deleted] in this field, that would return all + // tables which are either active or deleted. At time of writing, that includes all + // tables that can exist. However, at some point in the future, we may want to extend + // the granularity of this endpoint and allow customers to see all tables that are in + // the process of being deleted, or maybe all tables that are in the process of being + // created, or maybe we'll need to add some other status like 'hidden'. Who knows. + // + // With the `SoftDeleted` method of filtering, adding more statuses would cause + // exponential blowup with the number of variants that could occur, since we'd want to + // support any combination of statuses. 
With this, however, that extension becomes way + easier and more backwards-compatible. + // + // We also want this to be, essentially, an optional list because it allows us to + be sure that the client is always explicitly specifying their list of filters. If + they leave a repeated field unspecified, we can't tell whether they just don't know + about the filters or if they explicitly want no filters. But making it an optional + allows us to force people to specify their filters, which is very nice for ensuring + everyone is doing what they want. + // + // It also, for now, allows us to keep backwards-compatibility, which is important. + optional TableStatusFilterList filters = 3; +} message GetTableRequest { oneof namespace_target { // Name of the namespace to get a table from. @@ -183,6 +222,9 @@ message DisableIcebergResponse {} message DeleteTableRequest { int64 table_id = 1; + // ID of the namespace this table is in. If not specified, the request may be slower as it will + // need to do more lookups. + int64 namespace_id = 2; } message DeleteTableResponse { @@ -192,6 +234,9 @@ message DeleteTableResponse { message RenameTableRequest { int64 table_id = 1; string new_name = 2; + // ID of the namespace this table is in. If not specified, the request may be slower as it will + // need to do more lookups.
+ int64 namespace_id = 3; } message RenameTableResponse { diff --git a/generated_types/src/lib.rs b/generated_types/src/lib.rs index 4dfcabb7..19bbafe4 100644 --- a/generated_types/src/lib.rs +++ b/generated_types/src/lib.rs @@ -7,6 +7,7 @@ clippy::large_enum_variant, clippy::use_self, clippy::allow_attributes, + clippy::uninlined_format_args, missing_copy_implementations )] diff --git a/influxdb2_client/Cargo.toml b/influxdb2_client/Cargo.toml index 090e0dc7..ddf07547 100644 --- a/influxdb2_client/Cargo.toml +++ b/influxdb2_client/Cargo.toml @@ -13,7 +13,7 @@ bytes = "1.10" futures = { version = "0.3", default-features = false } reqwest = { workspace = true, features = ["stream", "json", "rustls-tls-native-roots"] } serde = { version = "1.0", features = ["derive"] } -serde_json = "1.0.141" +serde_json = "1.0.143" snafu = "0.8" url = "2.5.3" uuid = { version = "1", features = ["v4"] } diff --git a/influxdb_influxql_parser/Cargo.toml b/influxdb_influxql_parser/Cargo.toml index 5cf47680..cbdd4057 100644 --- a/influxdb_influxql_parser/Cargo.toml +++ b/influxdb_influxql_parser/Cargo.toml @@ -18,7 +18,7 @@ num-integer = { version = "0.1", default-features = false, features = [ "std", ] } num-traits = "0.2" -thiserror = "2.0.12" +thiserror = "2.0.16" workspace-hack = { version = "0.1", path = "../workspace-hack" } [dev-dependencies] # In alphabetical order diff --git a/influxdb_iox_client/Cargo.toml b/influxdb_iox_client/Cargo.toml index 67053ac0..cce819fa 100644 --- a/influxdb_iox_client/Cargo.toml +++ b/influxdb_iox_client/Cargo.toml @@ -42,14 +42,14 @@ prost = { workspace = true, optional = true } rand = { version = "0.9.2", optional = true } reqwest = { workspace = true, features = ["stream", "rustls-tls-native-roots"] } schema = { path = "../schema", optional = true } -serde_json = { version = "1.0.141", optional = true } +serde_json = { version = "1.0.143", optional = true } tokio = { version = "1.47", features = [ "macros", "parking_lot", "rt-multi-thread", ] } 
tokio-stream = "0.1.17" -thiserror = "2.0.12" +thiserror = "2.0.16" tonic-reflection = { version = "0.12" } [dev-dependencies] diff --git a/influxdb_iox_client/src/client/flight/mod.rs b/influxdb_iox_client/src/client/flight/mod.rs index 30248a59..d2a4000b 100644 --- a/influxdb_iox_client/src/client/flight/mod.rs +++ b/influxdb_iox_client/src/client/flight/mod.rs @@ -28,6 +28,8 @@ pub mod generated_types { pub use generated_types::influxdata::iox::querier::v1::*; } +pub use ::generated_types::tonic::codec::CompressionEncoding; + /// Error responses when querying an IOx namespace using the IOx Flight API. #[derive(Debug, Error)] pub enum Error { @@ -238,6 +240,20 @@ impl Client { Ok(self.inner.add_header(key, value)?) } + /// Accept compression. + /// + /// This is a set and the server will pick one option from it (plus the option "no compression"). + pub fn accept_compressed(&mut self, encoding: CompressionEncoding) { + *self.inner.inner_mut() = self.inner.inner_mut().clone().accept_compressed(encoding); + } + + /// Send compression. + /// + /// Only ONE compression can be sent. Ask your server operator which encodings are supported.
+ pub fn send_compressed(&mut self, encoding: CompressionEncoding) { + *self.inner.inner_mut() = self.inner.inner_mut().clone().send_compressed(encoding); + } + /// Create a new [`QueryBuilder`] to construct a query, optionally with parameters, on the /// given namespace pub fn query(&mut self, database: impl Into + Send) -> QueryBuilder<'_, NoQuery> { diff --git a/influxdb_iox_client/src/client/table.rs b/influxdb_iox_client/src/client/table.rs index 2cc543e4..0fef4244 100644 --- a/influxdb_iox_client/src/client/table.rs +++ b/influxdb_iox_client/src/client/table.rs @@ -9,6 +9,7 @@ use ::generated_types::influxdata::iox::Target; /// Re-export generated_types pub mod generated_types { pub use generated_types::influxdata::iox::{ + common::v1::SoftDeleted, partition_template::v1::{template_part::*, *}, table::v1::*, }; @@ -32,11 +33,15 @@ impl Client { pub async fn get_tables( &mut self, namespace: impl Into + Send, + filters: Option>, ) -> Result, Error> { Ok(self .inner .get_tables(GetTablesRequest { target: Some(namespace.into().into()), + filters: filters.map(|filters| TableStatusFilterList { + inner: filters.into_iter().map(|f| f as i32).collect(), + }), }) .await? .into_inner() @@ -81,10 +86,17 @@ impl Client { } /// Soft delete a table - pub async fn soft_delete_table(&mut self, table_id: i64) -> Result { + pub async fn soft_delete_table( + &mut self, + table_id: i64, + namespace_id: i64, + ) -> Result { let response = self .inner - .delete_table(DeleteTableRequest { table_id }) + .delete_table(DeleteTableRequest { + table_id, + namespace_id, + }) .await?; Ok(response.into_inner().table.unwrap_field("table")?) 
diff --git a/influxdb_line_protocol/src/v3/mod.rs b/influxdb_line_protocol/src/v3/mod.rs index 315d3ed4..ee2b077b 100644 --- a/influxdb_line_protocol/src/v3/mod.rs +++ b/influxdb_line_protocol/src/v3/mod.rs @@ -263,10 +263,10 @@ fn field_family_normal_char(i: &str) -> IResult<&str, &str> { if c == ':' { // Peek to see if the next char is also a colon, and if not, // keep consuming. - if let Some((_, next_ch)) = iter.peek() { - if *next_ch != ':' { - continue; - } + if let Some((_, next_ch)) = iter.peek() + && *next_ch != ':' + { + continue; } } diff --git a/iox_query/Cargo.toml b/iox_query/Cargo.toml index 54936c13..ad969a4e 100644 --- a/iox_query/Cargo.toml +++ b/iox_query/Cargo.toml @@ -29,7 +29,7 @@ datafusion_util = { path = "../datafusion_util" } executor = { path = "../executor" } futures = "0.3" hashbrown = { workspace = true } -indexmap = { version = "2.10", features = ["std"] } +indexmap = { version = "2.11", features = ["std"] } influxdb-line-protocol = { path = "../influxdb_line_protocol" } itertools = "0.13.0" iox_query_params = { path = "../iox_query_params" } diff --git a/iox_query/src/exec/context.rs b/iox_query/src/exec/context.rs index 4cd99051..a0f69bcf 100644 --- a/iox_query/src/exec/context.rs +++ b/iox_query/src/exec/context.rs @@ -661,11 +661,6 @@ impl IOxSessionContext { ) } - /// Record an event on the span recorder - pub fn record_event(&mut self, name: &'static str) { - self.recorder.event(SpanEvent::new(name)); - } - /// Record an event on the span recorder pub fn set_metadata(&mut self, name: &'static str, value: impl Into) { self.recorder.set_metadata(name, value); diff --git a/iox_query/src/exec/gapfill/mod.rs b/iox_query/src/exec/gapfill/mod.rs index 6b52ad48..88f846bd 100644 --- a/iox_query/src/exec/gapfill/mod.rs +++ b/iox_query/src/exec/gapfill/mod.rs @@ -35,7 +35,7 @@ use datafusion::{ }; use datafusion_util::ThenWithOpt; pub use gap_expander::{ExpandedValue, GapExpander}; -use std::cmp::Ordering; +use std::{cmp::Ordering, slice}; 
use std::{ convert::Infallible, fmt::{self, Debug}, @@ -550,7 +550,7 @@ impl GapFillExec { let eq_properties = match input.properties().output_ordering() { None => EquivalenceProperties::new(schema), Some(output_ordering) => { - EquivalenceProperties::new_with_orderings(schema, &[output_ordering.clone()]) + EquivalenceProperties::new_with_orderings(schema, slice::from_ref(output_ordering)) } }; diff --git a/iox_query/src/logical_optimizer/influx_regex_to_datafusion_regex.rs b/iox_query/src/logical_optimizer/influx_regex_to_datafusion_regex.rs index 7d90a1ac..6d43a14e 100644 --- a/iox_query/src/logical_optimizer/influx_regex_to_datafusion_regex.rs +++ b/iox_query/src/logical_optimizer/influx_regex_to_datafusion_regex.rs @@ -73,16 +73,15 @@ impl TreeNodeRewriter for InfluxRegexToDataFusionRegex { let name = func.name(); if (args.len() == 2) && ((name == REGEX_MATCH_UDF_NAME) || (name == REGEX_NOT_MATCH_UDF_NAME)) + && let Expr::Literal(ScalarValue::Utf8(Some(s)), _) = &args[1] { - if let Expr::Literal(ScalarValue::Utf8(Some(s)), _) = &args[1] { - let s = clean_non_meta_escapes(s); - let op = match name { - REGEX_MATCH_UDF_NAME => Operator::RegexMatch, - REGEX_NOT_MATCH_UDF_NAME => Operator::RegexNotMatch, - _ => unreachable!(), - }; - return Ok(Transformed::yes(binary_expr(args.remove(0), op, lit(s)))); - } + let s = clean_non_meta_escapes(s); + let op = match name { + REGEX_MATCH_UDF_NAME => Operator::RegexMatch, + REGEX_NOT_MATCH_UDF_NAME => Operator::RegexNotMatch, + _ => unreachable!(), + }; + return Ok(Transformed::yes(binary_expr(args.remove(0), op, lit(s)))); } Ok(Transformed::yes(Expr::ScalarFunction(ScalarFunction { diff --git a/iox_query/src/physical_optimizer/sort/merge_partitions.rs b/iox_query/src/physical_optimizer/sort/merge_partitions.rs index 46bd3b0e..44cb8d4d 100644 --- a/iox_query/src/physical_optimizer/sort/merge_partitions.rs +++ b/iox_query/src/physical_optimizer/sort/merge_partitions.rs @@ -100,17 +100,16 @@ pub fn 
merge_partitions_after_parallelized_sorting( } else { // If all lexical ranges are the same, then the partitions are a result of repartitioning. Insert an SPM above the sort. if let Some(lexical_ranges) = extract_ranges_from_plan(ordering_req, &ctx.plan)? + && lexical_ranges.iter().dedup().collect_vec().len() == 1 { - if lexical_ranges.iter().dedup().collect_vec().len() == 1 { - let plan = add_sort_preserving_merge( - Arc::clone(&ctx.plan), - sort_exec.expr(), - sort_exec.fetch(), - )?; - let mut new_ctx = MergePartitionsContext::new_default(plan); - new_ctx.data.has_merged_parallelized_sort = true; - return Ok(Transformed::yes(new_ctx)); - } + let plan = add_sort_preserving_merge( + Arc::clone(&ctx.plan), + sort_exec.expr(), + sort_exec.fetch(), + )?; + let mut new_ctx = MergePartitionsContext::new_default(plan); + new_ctx.data.has_merged_parallelized_sort = true; + return Ok(Transformed::yes(new_ctx)); }; Ok(Transformed::no(ctx)) diff --git a/iox_query/src/provider.rs b/iox_query/src/provider.rs index 646a735d..17142b7d 100644 --- a/iox_query/src/provider.rs +++ b/iox_query/src/provider.rs @@ -310,6 +310,8 @@ impl TableProvider for ChunkTableProvider { #[cfg(test)] mod test { + use std::slice; + use super::*; use crate::{ exec::IOxSessionContext, @@ -546,7 +548,7 @@ mod test { // simple plan let plan = provider - .scan(&state, None, &[pred.clone()], None) + .scan(&state, None, slice::from_ref(&pred), None) .await .unwrap(); insta::assert_yaml_snapshot!( @@ -563,7 +565,7 @@ mod test { // projection let plan = provider - .scan(&state, Some(&vec![1, 3]), &[pred.clone()], None) + .scan(&state, Some(&vec![1, 3]), slice::from_ref(&pred), None) .await .unwrap(); insta::assert_yaml_snapshot!( diff --git a/iox_query/src/provider/deduplicate.rs b/iox_query/src/provider/deduplicate.rs index c63294a8..ea837c6f 100644 --- a/iox_query/src/provider/deduplicate.rs +++ b/iox_query/src/provider/deduplicate.rs @@ -1,7 +1,7 @@ //! 
Implemention of DeduplicateExec operator (resolves primary key conflicts) plumbing and tests mod algo; -use std::collections::HashMap; +use std::{collections::HashMap, slice}; use std::{collections::HashSet, fmt, sync::Arc}; use arrow::{error::ArrowError, record_batch::RecordBatch}; @@ -189,7 +189,7 @@ impl DeduplicateExec { ) -> PlanProperties { trace!("Deduplicate output ordering: {:?}", sort_keys); let eq_properties = - EquivalenceProperties::new_with_orderings(input.schema(), &[sort_keys.clone()]); + EquivalenceProperties::new_with_orderings(input.schema(), slice::from_ref(sort_keys)); let output_partitioning = Partitioning::UnknownPartitioning(1); @@ -416,7 +416,7 @@ mod test { use arrow::array::{DictionaryArray, Int64Array}; use arrow_util::display::pretty_format_batches; use schema::TIME_DATA_TIMEZONE; - use std::iter::FromIterator; + use std::{iter::FromIterator, slice}; #[tokio::test] async fn test_single_tag() { @@ -921,7 +921,7 @@ mod test { "| | | 1.0 |", "+----+----+-----+", ]; - assert_batches_eq!(&expected_input_batch, &[b1.clone()]); + assert_batches_eq!(&expected_input_batch, slice::from_ref(&b1)); // sort on t1, t2 let sort_keys = vec![ @@ -1084,7 +1084,7 @@ mod test { "| b | | 1.0 |", "+----+----+-----+", ]; - assert_batches_eq!(&expected_input_batch, &[b1.clone()]); + assert_batches_eq!(&expected_input_batch, slice::from_ref(&b1)); // sort on t1, t2 let sort_keys = vec![ @@ -1251,7 +1251,7 @@ mod test { "| b | a | 1.0 |", "+----+----+-----+", ]; - assert_batches_eq!(&expected_input_batch, &[b1.clone()]); + assert_batches_eq!(&expected_input_batch, slice::from_ref(&b1)); // sort on t1, t2 let sort_keys = vec![ diff --git a/iox_query_influxql/Cargo.toml b/iox_query_influxql/Cargo.toml index c5f5f124..e3a01c20 100644 --- a/iox_query_influxql/Cargo.toml +++ b/iox_query_influxql/Cargo.toml @@ -24,7 +24,7 @@ predicate = { path = "../predicate" } query_functions = { path = "../query_functions" } regex = "1" schema = { path = "../schema" } -serde_json = 
"1.0.141" +serde_json = "1.0.143" thiserror = "2.0" workspace-hack = { version = "0.1", path = "../workspace-hack" } diff --git a/iox_query_influxql/src/frontend/planner.rs b/iox_query_influxql/src/frontend/planner.rs index 3808e453..763487dc 100644 --- a/iox_query_influxql/src/frontend/planner.rs +++ b/iox_query_influxql/src/frontend/planner.rs @@ -6,12 +6,12 @@ use influxdb_influxql_parser::show_measurements::ShowMeasurementsStatement; use influxdb_influxql_parser::show_tag_keys::ShowTagKeysStatement; use influxdb_influxql_parser::show_tag_values::ShowTagValuesStatement; use iox_query_params::StatementParams; -use std::any::Any; use std::collections::{HashMap, HashSet}; use std::fmt; use std::fmt::Debug; use std::ops::Deref; use std::sync::Arc; +use std::{any::Any, slice}; use crate::plan::{InfluxQLToLogicalPlan, SchemaProvider, parse_regex}; use datafusion::datasource::provider_as_source; @@ -98,7 +98,7 @@ impl SchemaExec { let eq_properties = match input.properties().output_ordering() { None => EquivalenceProperties::new(schema), Some(output_ordering) => { - EquivalenceProperties::new_with_orderings(schema, &[output_ordering.clone()]) + EquivalenceProperties::new_with_orderings(schema, slice::from_ref(output_ordering)) } }; diff --git a/iox_query_influxql/src/plan/ir.rs b/iox_query_influxql/src/plan/ir.rs index 74279e2a..94f9b557 100644 --- a/iox_query_influxql/src/plan/ir.rs +++ b/iox_query_influxql/src/plan/ir.rs @@ -85,9 +85,6 @@ pub(super) struct Select { /// /// [time_zone_clause]: https://docs.influxdata.com/influxdb/v1.8/query_language/explore-data/#the-time-zone-clause pub(super) timezone: Option, - - /// `true` when the projection contains an `INTEGRAL` function. - pub(super) has_integral: bool, } impl From