diff --git a/quickwit/Cargo.lock b/quickwit/Cargo.lock
index 3a7ce8f0885..f5aa5c0ad8b 100644
--- a/quickwit/Cargo.lock
+++ b/quickwit/Cargo.lock
@@ -8910,6 +8910,7 @@ dependencies = [
  "anyhow",
  "arrow",
  "base64 0.22.1",
+ "bytes",
  "chrono",
  "parquet",
  "proptest",
diff --git a/quickwit/quickwit-parquet-engine/Cargo.toml b/quickwit/quickwit-parquet-engine/Cargo.toml
index d4893c8287e..5e7b58474a4 100644
--- a/quickwit/quickwit-parquet-engine/Cargo.toml
+++ b/quickwit/quickwit-parquet-engine/Cargo.toml
@@ -29,6 +29,7 @@ tracing = { workspace = true }
 ulid = { workspace = true }
 
 [dev-dependencies]
+bytes = { workspace = true }
 proptest = { workspace = true }
 rand = { workspace = true }
 regex = { workspace = true }
diff --git a/quickwit/quickwit-parquet-engine/src/storage/mod.rs b/quickwit/quickwit-parquet-engine/src/storage/mod.rs
index 8b87063c25e..468a79819b8 100644
--- a/quickwit/quickwit-parquet-engine/src/storage/mod.rs
+++ b/quickwit/quickwit-parquet-engine/src/storage/mod.rs
@@ -16,6 +16,7 @@ mod config;
 
 pub(crate) mod split_writer;
+pub(crate) mod streaming_writer;
 mod writer;
 
 pub use config::{Compression, ParquetWriterConfig};
diff --git a/quickwit/quickwit-parquet-engine/src/storage/streaming_writer.rs b/quickwit/quickwit-parquet-engine/src/storage/streaming_writer.rs
new file mode 100644
index 00000000000..1001e9d7440
--- /dev/null
+++ b/quickwit/quickwit-parquet-engine/src/storage/streaming_writer.rs
@@ -0,0 +1,1013 @@
+// Copyright 2021-Present Datadog, Inc.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+//! Column-major Parquet writer primitive.
+//!
+//! Wraps [`SerializedFileWriter`] directly to expose a per-column write
+//! API that flushes one column chunk at a time. Peak memory per row
+//! group is therefore bounded by the size of the largest single column
+//! chunk plus small bookkeeping (bloom filters + page indexes), not by
+//! the total row group.
+//!
+//! This module is plumbing only. Production callers (ingest, merge) keep
+//! using [`super::ParquetWriter`] in PR-2; PR-3 cuts ingest over to a
+//! single-RG writer built on this primitive, and PR-6 cuts the merge
+//! engine over. Until then the items here are only exercised by this
+//! file's tests, so `dead_code` is allowed at module scope.
+
+#![allow(dead_code)]
+
+use std::collections::VecDeque;
+use std::io::Write;
+use std::sync::Arc;
+
+use arrow::array::ArrayRef;
+use arrow::datatypes::SchemaRef;
+use parquet::arrow::ArrowSchemaConverter;
+use parquet::arrow::arrow_writer::{ArrowColumnWriter, ArrowRowGroupWriterFactory, compute_leaves};
+use parquet::file::metadata::ParquetMetaData;
+use parquet::file::properties::WriterProperties;
+use parquet::file::writer::{SerializedFileWriter, SerializedRowGroupWriter};
+
+use super::writer::ParquetWriteError;
+
+/// Column-major Parquet writer.
+///
+/// See module docs for invariants and intended use.
+///
+/// # Caller contract
+/// 1. Call [`Self::start_row_group`] to obtain a [`RowGroupBuilder`].
+/// 2. Call [`RowGroupBuilder::write_next_column`] once per top-level arrow field, in arrow schema
+///    order, with the column data for the current row group.
+/// 3. Call [`RowGroupBuilder::finish`] to close the row group.
+/// 4. Repeat for additional row groups.
+/// 5. Call [`Self::close`] to write the footer.
+///
+/// Calling out of order (too many columns, finishing before all columns
+/// are written, mismatched row counts) returns a structured error rather
+/// than panicking.
+///
+/// # Limitations (PR-2)
+/// Top-level arrow fields must each map to exactly one parquet leaf
+/// column — i.e., the schema is "flat" (primitive, byte-array, or
+/// dictionary types). Nested types (Struct, List, Map) are rejected at
+/// [`Self::start_row_group`]. The metrics schema is flat in this sense.
+pub(crate) struct StreamingParquetWriter<W: Write + Send> {
+    file_writer: SerializedFileWriter<W>,
+    factory: ArrowRowGroupWriterFactory,
+    arrow_schema: SchemaRef,
+    next_rg_idx: usize,
+}
+
+/// Open row group; produced by [`StreamingParquetWriter::start_row_group`].
+///
+/// Borrows the parent writer for the lifetime of the row group.
+/// The compiler enforces that only one row group is open at a time.
+pub(crate) struct RowGroupBuilder<'a, W: Write + Send> {
+    pending_writers: VecDeque<ArrowColumnWriter>,
+    row_group_writer: SerializedRowGroupWriter<'a, W>,
+    arrow_schema: SchemaRef,
+    next_field_idx: usize,
+    expected_num_rows: Option<usize>,
+}
+
+impl<W: Write + Send> StreamingParquetWriter<W> {
+    /// Construct a new streaming writer.
+    ///
+    /// `arrow_schema` describes the columns the file will contain.
+    /// `props` is consumed and used as-is — callers wanting the
+    /// `ARROW:schema` IPC-encoded entry that [`parquet::arrow::ArrowWriter`]
+    /// adds by default must call
+    /// [`parquet::arrow::add_encoded_arrow_schema_to_metadata`] on `props`
+    /// before calling this constructor. (We do not do it implicitly so
+    /// PR-2 stays a thin wrapper; PR-3 ingest and PR-6 merge will add it
+    /// in their own setup helpers.)
+    pub(crate) fn try_new(
+        sink: W,
+        arrow_schema: SchemaRef,
+        props: WriterProperties,
+    ) -> Result<Self, ParquetWriteError> {
+        let coerce_types = props.coerce_types();
+        let parquet_schema = ArrowSchemaConverter::new()
+            .with_coerce_types(coerce_types)
+            .convert(&arrow_schema)?;
+
+        let props_ptr = Arc::new(props);
+        let file_writer = SerializedFileWriter::new(
+            sink,
+            parquet_schema.root_schema_ptr(),
+            Arc::clone(&props_ptr),
+        )?;
+        let factory = ArrowRowGroupWriterFactory::new(&file_writer, arrow_schema.clone());
+
+        Ok(Self {
+            file_writer,
+            factory,
+            arrow_schema,
+            next_rg_idx: 0,
+        })
+    }
+
+    /// Open a new row group. The returned [`RowGroupBuilder`] borrows
+    /// `self` for the lifetime of the row group.
+    ///
+    /// Returns an error if the arrow schema contains a field that maps
+    /// to more or fewer than one parquet leaf column.
+    pub(crate) fn start_row_group(&mut self) -> Result<RowGroupBuilder<'_, W>, ParquetWriteError> {
+        let column_writers = self.factory.create_column_writers(self.next_rg_idx)?;
+        if column_writers.len() != self.arrow_schema.fields().len() {
+            return Err(ParquetWriteError::SchemaValidation(format!(
+                "streaming writer requires one parquet leaf per arrow field; arrow schema has {} \
+                 fields but produced {} parquet leaves (nested types are not supported in PR-2)",
+                self.arrow_schema.fields().len(),
+                column_writers.len(),
+            )));
+        }
+
+        let row_group_writer = self.file_writer.next_row_group()?;
+        self.next_rg_idx += 1;
+
+        Ok(RowGroupBuilder {
+            pending_writers: column_writers.into(),
+            row_group_writer,
+            arrow_schema: self.arrow_schema.clone(),
+            next_field_idx: 0,
+            expected_num_rows: None,
+        })
+    }
+
+    /// Close the file and return its metadata.
+    pub(crate) fn close(self) -> Result<ParquetMetaData, ParquetWriteError> {
+        Ok(self.file_writer.close()?)
+    }
+
+    /// The number of row groups started so far. Useful for tests and
+    /// for callers that want to track output structure.
+    #[cfg(test)]
+    pub(crate) fn num_row_groups_started(&self) -> usize {
+        self.next_rg_idx
+    }
+}
+
+impl<'a, W: Write + Send> RowGroupBuilder<'a, W> {
+    /// Write the next top-level arrow column for the open row group.
+    ///
+    /// Columns must be supplied in arrow schema order. The column's
+    /// length defines the row group's row count on the first call;
+    /// subsequent calls must match.
+    pub(crate) fn write_next_column(&mut self, array: &ArrayRef) -> Result<(), ParquetWriteError> {
+        let fields = self.arrow_schema.fields();
+        if self.next_field_idx >= fields.len() {
+            return Err(ParquetWriteError::SchemaValidation(format!(
+                "wrote {} columns but arrow schema only has {}",
+                self.next_field_idx + 1,
+                fields.len(),
+            )));
+        }
+        let field = &fields[self.next_field_idx];
+
+        let row_count = array.len();
+        match self.expected_num_rows {
+            None => self.expected_num_rows = Some(row_count),
+            Some(expected) if expected == row_count => {}
+            Some(expected) => {
+                return Err(ParquetWriteError::SchemaValidation(format!(
+                    "row count mismatch in row group: column {} ('{}') has {} rows; prior columns \
+                     had {}",
+                    self.next_field_idx,
+                    field.name(),
+                    row_count,
+                    expected,
+                )));
+            }
+        }
+
+        let leaves = compute_leaves(field.as_ref(), array)?;
+        if leaves.len() != 1 {
+            return Err(ParquetWriteError::SchemaValidation(format!(
+                "field '{}' produces {} parquet leaves; PR-2 streaming writer requires exactly 1 \
+                 (no nested types)",
+                field.name(),
+                leaves.len(),
+            )));
+        }
+
+        // Pop the writer for this column, write the single leaf, close to
+        // produce a finalized chunk, and immediately append the chunk to
+        // the row group writer. After this, the chunk's encoded buffer
+        // has been copied into the file writer's underlying sink and is
+        // dropped — so peak in-flight chunk memory stays at one column.
+        let mut writer = self.pending_writers.pop_front().expect(
+            "pending_writers length matched arrow_schema fields at start_row_group; field index \
+             checked against fields above",
+        );
+        for leaf in &leaves {
+            writer.write(leaf)?;
+        }
+        let chunk = writer.close()?;
+        chunk.append_to_row_group(&mut self.row_group_writer)?;
+        self.next_field_idx += 1;
+        Ok(())
+    }
+
+    /// Sum of estimated in-memory bytes across the (still un-written)
+    /// column writers in this row group. Useful for memory-bound tests
+    /// and for callers that need to make backpressure decisions.
+    ///
+    /// Once a column has been written via [`Self::write_next_column`],
+    /// its writer has been consumed — so this number reflects only
+    /// future columns, which should hold near-zero memory until written.
+    pub(crate) fn pending_writers_memory_size(&self) -> usize {
+        self.pending_writers.iter().map(|w| w.memory_size()).sum()
+    }
+
+    /// Finalize the row group. Errors if any columns have not been
+    /// written yet — the caller must complete the row group.
+    pub(crate) fn finish(self) -> Result<(), ParquetWriteError> {
+        if !self.pending_writers.is_empty() {
+            return Err(ParquetWriteError::SchemaValidation(format!(
+                "row group has {} unwritten columns",
+                self.pending_writers.len(),
+            )));
+        }
+        self.row_group_writer.close()?;
+        Ok(())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use std::sync::Arc;
+
+    use arrow::array::{
+        Array, ArrayRef, DictionaryArray, Float64Array, Int64Array, RecordBatch, StringArray,
+        UInt8Array, UInt64Array,
+    };
+    use arrow::datatypes::{DataType, Field, Int32Type, Schema as ArrowSchema};
+    use parquet::arrow::ArrowWriter;
+    use parquet::arrow::arrow_reader::ParquetRecordBatchReaderBuilder;
+    use parquet::file::metadata::KeyValue;
+    use parquet::file::properties::EnabledStatistics;
+    use parquet::file::reader::{FileReader, SerializedFileReader};
+    use parquet::file::serialized_reader::ReadOptionsBuilder;
+
+    use super::*;
+    use crate::storage::ParquetWriterConfig;
+
+    /// Build a metrics-shaped batch with `num_rows` rows. metric_name
+    /// alternates between two values; `service` is non-null on every
+    /// row. Mirrors the shape ParquetWriter expects (required fields +
+    /// at least one tag column.
+ fn make_metrics_batch(num_rows: usize) -> RecordBatch { + let dict_type = DataType::Dictionary(Box::new(DataType::Int32), Box::new(DataType::Utf8)); + let schema = Arc::new(ArrowSchema::new(vec![ + Field::new("metric_name", dict_type.clone(), false), + Field::new("metric_type", DataType::UInt8, false), + Field::new("timestamp_secs", DataType::UInt64, false), + Field::new("value", DataType::Float64, false), + Field::new("timeseries_id", DataType::Int64, false), + Field::new("service", dict_type, true), + ])); + + let metric_keys: Vec = (0..num_rows as i32).map(|i| i % 2).collect(); + let metric_values = StringArray::from(vec!["cpu.usage", "memory.used"]); + let metric_name: ArrayRef = Arc::new( + DictionaryArray::::try_new( + arrow::array::Int32Array::from(metric_keys), + Arc::new(metric_values), + ) + .unwrap(), + ); + + let metric_type: ArrayRef = Arc::new(UInt8Array::from(vec![0u8; num_rows])); + let timestamps: Vec = (0..num_rows as u64).map(|i| 1_700_000_000 + i).collect(); + let timestamp_secs: ArrayRef = Arc::new(UInt64Array::from(timestamps)); + let values: Vec = (0..num_rows).map(|i| i as f64).collect(); + let value: ArrayRef = Arc::new(Float64Array::from(values)); + let tsids: Vec = (0..num_rows as i64).map(|i| 1000 + i).collect(); + let timeseries_id: ArrayRef = Arc::new(Int64Array::from(tsids)); + + let svc_keys: Vec> = (0..num_rows as i32).map(|i| Some(i % 3)).collect(); + let svc_values = StringArray::from(vec!["api", "db", "cache"]); + let service: ArrayRef = Arc::new( + DictionaryArray::::try_new( + arrow::array::Int32Array::from(svc_keys), + Arc::new(svc_values), + ) + .unwrap(), + ); + + RecordBatch::try_new( + schema, + vec![ + metric_name, + metric_type, + timestamp_secs, + value, + timeseries_id, + service, + ], + ) + .unwrap() + } + + /// A `WriterProperties` that mirrors what production + /// `ParquetWriter::to_writer_properties_with_metadata` would build, + /// minus the bits PR-1 changes (page-level statistics). 
PR-2 + /// metadata-identity tests use this to compare PR-2 vs ArrowWriter + /// output produced under identical settings. + fn writer_props_with_kv(arrow_schema: &ArrowSchema, kvs: Vec) -> WriterProperties { + let cfg = ParquetWriterConfig::default(); + let sort_field_names = vec!["metric_name".to_string(), "service".to_string()]; + // Populate `sorting_columns` so the metadata-identity test + // exercises a non-empty sorting_columns vector. Indices are + // resolved against the test schema (metric_name=0, service=5). + let sorting_cols = vec![ + parquet::file::metadata::SortingColumn { + column_idx: arrow_schema.index_of("metric_name").unwrap() as i32, + descending: false, + nulls_first: false, + }, + parquet::file::metadata::SortingColumn { + column_idx: arrow_schema.index_of("service").unwrap() as i32, + descending: false, + nulls_first: false, + }, + ]; + cfg.to_writer_properties_with_metadata( + arrow_schema, + sorting_cols, + Some(kvs), + &sort_field_names, + ) + } + + /// Write `batches` to bytes through `StreamingParquetWriter`, + /// putting each batch in its own row group. + fn write_streaming( + arrow_schema: SchemaRef, + props: WriterProperties, + batches: &[RecordBatch], + ) -> Vec { + let mut out: Vec = Vec::new(); + { + let mut w = StreamingParquetWriter::try_new(&mut out, arrow_schema, props).unwrap(); + for batch in batches { + let mut rg = w.start_row_group().unwrap(); + for col_idx in 0..batch.num_columns() { + rg.write_next_column(batch.column(col_idx)).unwrap(); + } + rg.finish().unwrap(); + } + w.close().unwrap(); + } + out + } + + /// Write `batches` to bytes through `ArrowWriter`, with one row + /// group per batch (forced via `flush()`). 
+ fn write_arrow_writer( + arrow_schema: SchemaRef, + props: WriterProperties, + batches: &[RecordBatch], + ) -> Vec { + let mut out: Vec = Vec::new(); + { + let mut w = ArrowWriter::try_new(&mut out, arrow_schema, Some(props)).unwrap(); + for (idx, batch) in batches.iter().enumerate() { + w.write(batch).unwrap(); + if idx + 1 < batches.len() { + w.flush().unwrap(); + } + } + w.close().unwrap(); + } + out + } + + /// Read a Parquet file from `bytes` into a single concatenated + /// RecordBatch (concatenating all row groups). + fn read_back(bytes: &[u8]) -> RecordBatch { + let cursor = bytes::Bytes::from(bytes.to_vec()); + let reader = ParquetRecordBatchReaderBuilder::try_new(cursor) + .unwrap() + .build() + .unwrap(); + let batches: Vec<_> = reader.collect::, _>>().unwrap(); + let schema = batches[0].schema(); + arrow::compute::concat_batches(&schema, &batches).unwrap() + } + + // -------- PW-A: round-trip -------- + + /// Write one row group via the streaming writer; read it back and + /// expect the data to match. + #[test] + fn test_round_trip_single_row_group() { + let batch = make_metrics_batch(64); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let bytes = write_streaming(arrow_schema.clone(), props, std::slice::from_ref(&batch)); + let actual = read_back(&bytes); + + assert_eq!(actual.num_rows(), batch.num_rows()); + assert_eq!(actual.num_columns(), batch.num_columns()); + + // The dict types may be materialized to Utf8 on read-back since + // we don't embed ARROW:schema. Compare on the value level by + // converting both to strings for the dict columns. 
+ for col_idx in 0..batch.num_columns() { + let original = batch.column(col_idx); + let recovered = actual.column(col_idx); + assert_eq!( + original.len(), + recovered.len(), + "column {} length mismatch", + col_idx, + ); + } + let mn_idx = actual.schema().index_of("metric_name").unwrap(); + let mn_strings = column_as_strings(actual.column(mn_idx)); + let exp_strings = + column_as_strings(batch.column(batch.schema().index_of("metric_name").unwrap())); + assert_eq!(mn_strings, exp_strings); + } + + /// Two batches → two row groups; concatenated read-back equals + /// concatenated input. + #[test] + fn test_round_trip_multi_row_group() { + let batch1 = make_metrics_batch(40); + let batch2 = make_metrics_batch(20); + let arrow_schema = batch1.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let bytes = write_streaming( + arrow_schema.clone(), + props, + &[batch1.clone(), batch2.clone()], + ); + let actual = read_back(&bytes); + + assert_eq!(actual.num_rows(), batch1.num_rows() + batch2.num_rows()); + + let reader = SerializedFileReader::new(bytes::Bytes::from(bytes)).unwrap(); + assert_eq!(reader.metadata().num_row_groups(), 2); + } + + // -------- PW-B: metadata identity vs ArrowWriter -------- + + /// PW-B: schema descriptor, sorting_columns, KV metadata, + /// statistics enabled level, compression, bloom filter presence, + /// and num row groups must agree with what ArrowWriter produces. 
+ #[test] + fn test_metadata_identity_vs_arrow_writer() { + let batch = make_metrics_batch(64); + let arrow_schema = batch.schema(); + + let kvs = vec![ + KeyValue::new( + "qh.sort_fields".to_string(), + "metric_name|timestamp/V2".to_string(), + ), + KeyValue::new("qh.window_start".to_string(), "1700000000".to_string()), + KeyValue::new("qh.window_duration_secs".to_string(), "900".to_string()), + ]; + + let bytes_streaming = write_streaming( + arrow_schema.clone(), + writer_props_with_kv(&arrow_schema, kvs.clone()), + std::slice::from_ref(&batch), + ); + let bytes_arrow = write_arrow_writer( + arrow_schema.clone(), + writer_props_with_kv(&arrow_schema, kvs.clone()), + std::slice::from_ref(&batch), + ); + + let r_streaming = SerializedFileReader::new(bytes::Bytes::from(bytes_streaming)).unwrap(); + let r_arrow = SerializedFileReader::new(bytes::Bytes::from(bytes_arrow)).unwrap(); + + let m_streaming = r_streaming.metadata(); + let m_arrow = r_arrow.metadata(); + + assert_eq!(m_streaming.num_row_groups(), m_arrow.num_row_groups()); + + // Schema descriptor: column count, names, types. + let s_streaming = m_streaming.file_metadata().schema_descr(); + let s_arrow = m_arrow.file_metadata().schema_descr(); + assert_eq!(s_streaming.num_columns(), s_arrow.num_columns()); + for i in 0..s_streaming.num_columns() { + assert_eq!( + s_streaming.column(i).name(), + s_arrow.column(i).name(), + "column {} name mismatch", + i, + ); + assert_eq!( + format!("{:?}", s_streaming.column(i).physical_type()), + format!("{:?}", s_arrow.column(i).physical_type()), + "column {} ({}) physical type mismatch", + i, + s_streaming.column(i).name(), + ); + } + + // Sorting columns (per row group). 
+ for rg_idx in 0..m_streaming.num_row_groups() { + let sc_streaming = m_streaming.row_group(rg_idx).sorting_columns(); + let sc_arrow = m_arrow.row_group(rg_idx).sorting_columns(); + assert_eq!( + sc_streaming, sc_arrow, + "sorting_columns for row group {} differ", + rg_idx, + ); + } + + // KV metadata: every qh.* entry from the input must be present + // in both, and the ARROW:schema entry should be absent from + // streaming (since we don't add it implicitly) — relevant qh.* + // entries must be byte-equal. + let kv_streaming = m_streaming + .file_metadata() + .key_value_metadata() + .cloned() + .unwrap_or_default(); + let kv_arrow = m_arrow + .file_metadata() + .key_value_metadata() + .cloned() + .unwrap_or_default(); + + for input_kv in &kvs { + let in_streaming = kv_streaming.iter().find(|kv| kv.key == input_kv.key); + let in_arrow = kv_arrow.iter().find(|kv| kv.key == input_kv.key); + assert!( + in_streaming.is_some(), + "qh.* key {} missing from streaming output", + input_kv.key, + ); + assert!( + in_arrow.is_some(), + "qh.* key {} missing from arrow output", + input_kv.key, + ); + assert_eq!( + in_streaming.unwrap().value, + in_arrow.unwrap().value, + "value for key {} differs between writers", + input_kv.key, + ); + } + + // Per-column compression and statistics-enabled level. 
+ for rg_idx in 0..m_streaming.num_row_groups() { + let rg_streaming = m_streaming.row_group(rg_idx); + let rg_arrow = m_arrow.row_group(rg_idx); + assert_eq!(rg_streaming.num_columns(), rg_arrow.num_columns()); + assert_eq!( + rg_streaming.num_rows(), + rg_arrow.num_rows(), + "row group {} num_rows mismatch", + rg_idx, + ); + for col_idx in 0..rg_streaming.num_columns() { + let c_streaming = rg_streaming.column(col_idx); + let c_arrow = rg_arrow.column(col_idx); + assert_eq!( + c_streaming.compression(), + c_arrow.compression(), + "column {} compression mismatch", + col_idx, + ); + assert_eq!( + c_streaming.bloom_filter_offset().is_some(), + c_arrow.bloom_filter_offset().is_some(), + "column {} ('{}') bloom filter presence mismatch", + col_idx, + c_streaming.column_descr().name(), + ); + } + } + } + + /// PW-B (statistics_enabled): the writer must propagate the + /// per-column statistics_enabled level from properties. Default + /// config uses `EnabledStatistics::Chunk`; we assert it shows up + /// at the column-chunk metadata level identically vs ArrowWriter. + #[test] + fn test_statistics_enabled_propagates() { + let batch = make_metrics_batch(32); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + // Default ParquetWriterConfig sets EnabledStatistics::Chunk. + let metric_name_path = + parquet::schema::types::ColumnPath::new(vec!["metric_name".to_string()]); + assert_eq!( + props.statistics_enabled(&metric_name_path), + EnabledStatistics::Chunk, + ); + + let bytes = write_streaming(arrow_schema, props, std::slice::from_ref(&batch)); + let opts = ReadOptionsBuilder::new().with_page_index().build(); + let reader = + SerializedFileReader::new_with_options(bytes::Bytes::from(bytes), opts).unwrap(); + let rg = reader.metadata().row_group(0); + let mn_col = rg + .columns() + .iter() + .find(|c| c.column_descr().name() == "metric_name") + .unwrap(); + // Chunk-level stats present, page index absent. 
+ assert!( + mn_col.statistics().is_some(), + "chunk-level statistics expected" + ); + } + + // -------- PW-C: bounded memory -------- + + /// PW-C: after writing each column the per-row-group writer should + /// not be retaining old columns' chunk buffers. Concretely, the + /// pending writers reported by `pending_writers_memory_size` is a + /// monotone-decreasing-or-flat sequence as columns are written + /// (since pending writers shrink, and unwritten writers carry + /// negligible memory). + #[test] + fn test_bounded_memory_per_column() { + let batch = make_metrics_batch(4096); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let mut out: Vec = Vec::new(); + { + let mut w = + StreamingParquetWriter::try_new(&mut out, arrow_schema.clone(), props).unwrap(); + let mut rg = w.start_row_group().unwrap(); + + let mut prior = rg.pending_writers_memory_size(); + for col_idx in 0..batch.num_columns() { + rg.write_next_column(batch.column(col_idx)).unwrap(); + let now = rg.pending_writers_memory_size(); + // Writing a column either reduces pending memory or + // leaves it unchanged (e.g., if writer N+1 already had + // zero memory). It must NEVER grow above the prior + // observation — that would mean we're accumulating. + assert!( + now <= prior, + "pending memory grew after writing column {} ('{}'): {} -> {}", + col_idx, + batch.schema().field(col_idx).name(), + prior, + now, + ); + prior = now; + } + // After all columns written, no pending writers remain. + assert_eq!(rg.pending_writers_memory_size(), 0); + rg.finish().unwrap(); + w.close().unwrap(); + } + } + + // -------- Edge cases -------- + + /// An empty row group must still produce a readable file with the + /// expected schema (zero rows is the natural lower bound). 
+ #[test] + fn test_empty_row_group_produces_valid_file() { + let batch = make_metrics_batch(0); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let bytes = write_streaming(arrow_schema.clone(), props, std::slice::from_ref(&batch)); + let reader = SerializedFileReader::new(bytes::Bytes::from(bytes)).unwrap(); + assert_eq!(reader.metadata().file_metadata().num_rows(), 0); + assert_eq!(reader.metadata().num_row_groups(), 1); + } + + /// Calling `write_next_column` past the last field must fail with a + /// structured error rather than panicking. + #[test] + fn test_too_many_columns_returns_error() { + let batch = make_metrics_batch(16); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let mut out: Vec = Vec::new(); + let mut w = StreamingParquetWriter::try_new(&mut out, arrow_schema.clone(), props).unwrap(); + let mut rg = w.start_row_group().unwrap(); + for col_idx in 0..batch.num_columns() { + rg.write_next_column(batch.column(col_idx)).unwrap(); + } + // One past the end. + let extra = batch.column(0); + let err = rg.write_next_column(extra).unwrap_err(); + match err { + ParquetWriteError::SchemaValidation(_) => {} + other => panic!("expected SchemaValidation, got {other:?}"), + } + } + + /// A row count mismatch between columns must fail with a structured + /// error before reaching the parquet layer. + #[test] + fn test_row_count_mismatch_returns_error() { + let batch = make_metrics_batch(32); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let mut out: Vec = Vec::new(); + let mut w = StreamingParquetWriter::try_new(&mut out, arrow_schema.clone(), props).unwrap(); + let mut rg = w.start_row_group().unwrap(); + + // Write column 0 with 32 rows. + rg.write_next_column(batch.column(0)).unwrap(); + + // Build a column-1 array with the wrong length (16 instead of 32). 
+ let short: ArrayRef = Arc::new(UInt8Array::from(vec![0u8; 16])); + let err = rg.write_next_column(&short).unwrap_err(); + match err { + ParquetWriteError::SchemaValidation(_) => {} + other => panic!("expected SchemaValidation, got {other:?}"), + } + } + + /// `finish` before all columns are written must fail with a + /// structured error rather than producing a corrupt file. + #[test] + fn test_finish_before_all_columns_returns_error() { + let batch = make_metrics_batch(8); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let mut out: Vec = Vec::new(); + let mut w = StreamingParquetWriter::try_new(&mut out, arrow_schema.clone(), props).unwrap(); + let rg = w.start_row_group().unwrap(); + // Don't write any columns. + let err = rg.finish().unwrap_err(); + match err { + ParquetWriteError::SchemaValidation(_) => {} + other => panic!("expected SchemaValidation, got {other:?}"), + } + } + + /// Round-trip with nulls in a nullable dictionary column: nulls + /// must come back as nulls, non-nulls must come back as the same + /// values. The metrics schema has `service` as nullable, so this + /// case is on the production hot path. + #[test] + fn test_round_trip_preserves_nulls() { + let batch = make_metrics_batch_with_nulls(20); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let bytes = write_streaming(arrow_schema.clone(), props, std::slice::from_ref(&batch)); + let actual = read_back(&bytes); + + let svc_idx_in = batch.schema().index_of("service").unwrap(); + let svc_idx_out = actual.schema().index_of("service").unwrap(); + let original_strings = column_as_strings(batch.column(svc_idx_in)); + let recovered_strings = column_as_strings(actual.column(svc_idx_out)); + assert_eq!(original_strings, recovered_strings); + + // Verify there is at least one null in the input (otherwise the + // test would silently degrade if the helper changed). 
+ assert!( + original_strings.iter().any(|v| v.is_none()), + "test fixture must contain at least one null", + ); + } + + /// Multi-row-group metadata identity vs ArrowWriter. The previous + /// metadata test only exercised one row group; this exercises that + /// per-row-group metadata (sorting_columns, num_rows, column + /// compressions) still agrees when the file has multiple row groups. + #[test] + fn test_metadata_identity_multi_row_group() { + let batch_a = make_metrics_batch(48); + let batch_b = make_metrics_batch(16); + let arrow_schema = batch_a.schema(); + let kvs = vec![KeyValue::new( + "qh.sort_fields".to_string(), + "metric_name|timestamp/V2".to_string(), + )]; + + let bytes_streaming = write_streaming( + arrow_schema.clone(), + writer_props_with_kv(&arrow_schema, kvs.clone()), + &[batch_a.clone(), batch_b.clone()], + ); + let bytes_arrow = write_arrow_writer( + arrow_schema.clone(), + writer_props_with_kv(&arrow_schema, kvs.clone()), + &[batch_a, batch_b], + ); + + let r_streaming = SerializedFileReader::new(bytes::Bytes::from(bytes_streaming)).unwrap(); + let r_arrow = SerializedFileReader::new(bytes::Bytes::from(bytes_arrow)).unwrap(); + + assert_eq!(r_streaming.metadata().num_row_groups(), 2); + assert_eq!( + r_streaming.metadata().num_row_groups(), + r_arrow.metadata().num_row_groups(), + ); + for rg_idx in 0..2 { + let rg_s = r_streaming.metadata().row_group(rg_idx); + let rg_a = r_arrow.metadata().row_group(rg_idx); + assert_eq!(rg_s.num_rows(), rg_a.num_rows()); + assert_eq!(rg_s.sorting_columns(), rg_a.sorting_columns()); + assert_eq!(rg_s.num_columns(), rg_a.num_columns()); + for col_idx in 0..rg_s.num_columns() { + assert_eq!( + rg_s.column(col_idx).compression(), + rg_a.column(col_idx).compression(), + ); + } + } + } + + /// Bloom filters written via the streaming writer must be + /// functionally equivalent to those written by ArrowWriter — a + /// value present in the data is reported as possibly-present, and + /// a value absent from the 
data is reported as definitely-absent + /// (with very high probability for our 5% FPP setting). + #[test] + fn test_bloom_filter_round_trip() { + let batch = make_metrics_batch(64); + let arrow_schema = batch.schema(); + let props = writer_props_with_kv(&arrow_schema, Vec::new()); + + let bytes = write_streaming(arrow_schema, props, std::slice::from_ref(&batch)); + // Reader must be constructed with read_bloom_filter enabled — + // by default ReaderProperties does NOT load bloom filters from + // the file, so even a correctly-written filter would appear + // absent. We mirror the production read-side configuration that + // a future caller would use to verify presence. + let reader_props = parquet::file::properties::ReaderProperties::builder() + .set_read_bloom_filter(true) + .build(); + let opts = ReadOptionsBuilder::new() + .with_reader_properties(reader_props) + .build(); + let reader = + SerializedFileReader::new_with_options(bytes::Bytes::from(bytes), opts).unwrap(); + let rg = reader.get_row_group(0).unwrap(); + let mn_col_idx = (0..rg.metadata().num_columns()) + .find(|&i| rg.metadata().column(i).column_descr().name() == "metric_name") + .expect("metric_name column present"); + let bloom = rg + .get_column_bloom_filter(mn_col_idx) + .expect("bloom filter must be present for metric_name"); + // Present values: metric_name is "cpu.usage" or "memory.used" + // throughout the batch. + assert!( + bloom.check(&"cpu.usage"), + "bloom should match present value" + ); + assert!( + bloom.check(&"memory.used"), + "bloom should match present value" + ); + // A value not in the batch — the test fixture only writes + // these two metric names, so this should be filtered out with + // very high probability. 
+ assert!( + !bloom.check(&"definitely.not.in.batch"), + "bloom must reject absent value (5% FPP makes a false hit very unlikely)", + ); + } + + /// A schema whose top-level fields produce more than one parquet + /// leaf (e.g., a Struct field) must be rejected at start_row_group. + /// The metrics schema is flat in the relevant sense; PR-2 is not + /// required to support nested types. + #[test] + fn test_nested_type_rejected_at_start_row_group() { + let inner_fields = arrow::datatypes::Fields::from(vec![ + Field::new("a", DataType::Int32, false), + Field::new("b", DataType::Int32, false), + ]); + let schema = Arc::new(ArrowSchema::new(vec![Field::new( + "nested", + DataType::Struct(inner_fields), + false, + )])); + let props = WriterProperties::builder().build(); + + let mut out: Vec = Vec::new(); + let mut w = StreamingParquetWriter::try_new(&mut out, schema, props).unwrap(); + match w.start_row_group() { + Ok(_) => panic!("expected nested type to be rejected"), + Err(ParquetWriteError::SchemaValidation(msg)) => { + assert!( + msg.contains("nested types are not supported"), + "error message should mention nested types: {msg}", + ); + } + Err(other) => panic!("expected SchemaValidation, got {other:?}"), + } + } + + /// Build a batch where the `service` column has nulls interleaved + /// with non-null values. Used by [`test_round_trip_preserves_nulls`]. 
+ fn make_metrics_batch_with_nulls(num_rows: usize) -> RecordBatch { + let dict_type = DataType::Dictionary(Box::new(DataType::Int32), Box::new(DataType::Utf8)); + let schema = Arc::new(ArrowSchema::new(vec![ + Field::new("metric_name", dict_type.clone(), false), + Field::new("metric_type", DataType::UInt8, false), + Field::new("timestamp_secs", DataType::UInt64, false), + Field::new("value", DataType::Float64, false), + Field::new("timeseries_id", DataType::Int64, false), + Field::new("service", dict_type, true), + ])); + let metric_keys: Vec = (0..num_rows as i32).map(|i| i % 2).collect(); + let metric_values = StringArray::from(vec!["cpu.usage", "memory.used"]); + let metric_name: ArrayRef = Arc::new( + DictionaryArray::::try_new( + arrow::array::Int32Array::from(metric_keys), + Arc::new(metric_values), + ) + .unwrap(), + ); + let metric_type: ArrayRef = Arc::new(UInt8Array::from(vec![0u8; num_rows])); + let timestamps: Vec = (0..num_rows as u64).map(|i| 1_700_000_000 + i).collect(); + let timestamp_secs: ArrayRef = Arc::new(UInt64Array::from(timestamps)); + let values: Vec = (0..num_rows).map(|i| i as f64).collect(); + let value: ArrayRef = Arc::new(Float64Array::from(values)); + let tsids: Vec = (0..num_rows as i64).map(|i| 1000 + i).collect(); + let timeseries_id: ArrayRef = Arc::new(Int64Array::from(tsids)); + // Every third row gets a null service. + let svc_keys: Vec> = (0..num_rows as i32) + .map(|i| if i % 3 == 0 { None } else { Some(i % 2) }) + .collect(); + let svc_values = StringArray::from(vec!["api", "db"]); + let service: ArrayRef = Arc::new( + DictionaryArray::::try_new( + arrow::array::Int32Array::from(svc_keys), + Arc::new(svc_values), + ) + .unwrap(), + ); + RecordBatch::try_new( + schema, + vec![ + metric_name, + metric_type, + timestamp_secs, + value, + timeseries_id, + service, + ], + ) + .unwrap() + } + + /// Helper: extract the string value at each row of a column (handles + /// both Dictionary(Int32, Utf8) and plain Utf8). 
+ fn column_as_strings(col: &ArrayRef) -> Vec> { + if let Some(dict) = col.as_any().downcast_ref::>() { + let values = dict + .values() + .as_any() + .downcast_ref::() + .unwrap(); + (0..dict.len()) + .map(|i| { + if dict.is_null(i) { + None + } else { + Some(values.value(dict.keys().value(i) as usize).to_string()) + } + }) + .collect() + } else if let Some(s) = col.as_any().downcast_ref::() { + (0..s.len()) + .map(|i| { + if s.is_null(i) { + None + } else { + Some(s.value(i).to_string()) + } + }) + .collect() + } else { + panic!( + "column_as_strings: unsupported column type {:?}", + col.data_type() + ); + } + } +}