diff --git a/.github/workflows/lint-rust.yml b/.github/workflows/lint-rust.yml index 9e124fd369fe..4fcac3c01040 100644 --- a/.github/workflows/lint-rust.yml +++ b/.github/workflows/lint-rust.yml @@ -38,7 +38,8 @@ jobs: save-if: ${{ github.ref_name == 'main' }} - name: Run cargo clippy with all features enabled - run: cargo clippy --workspace --all-targets --all-features -- -D warnings + # not all nano-arrow features can be combined with each other, so exclude it from the all-features run + run: cargo clippy --workspace --all-targets --exclude nano-arrow --all-features -- -D warnings # Default feature set should compile on the stable toolchain clippy-stable: @@ -58,7 +59,7 @@ jobs: save-if: ${{ github.ref_name == 'main' }} - name: Run cargo clippy - run: cargo clippy --workspace --all-targets -- -D warnings + run: cargo clippy --workspace --all-targets --exclude nano-arrow -- -D warnings rustfmt: if: github.ref_name != 'main' diff --git a/Cargo.toml b/Cargo.toml index 7809758a5f22..a721ff8f095e 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -28,7 +28,7 @@ bytemuck = { version = "1", features = ["derive", "extern_crate_alloc"] } chrono = { version = "0.4", default-features = false, features = ["std"] } chrono-tz = "0.8.1" ciborium = "0.2" -either = "1.8" +either = "1.9" futures = "0.3.25" hashbrown = { version = "0.14", features = ["rayon", "ahash"] } indexmap = { version = "2", features = ["std"] } @@ -50,6 +50,12 @@ strum_macros = "0.25" thiserror = "1" url = "2.3.1" version_check = "0.9.4" +simdutf8 = "0.1.4" +hex = "0.4.3" +base64 = "0.21.2" +fallible-streaming-iterator = "0.1.9" +streaming-iterator = "0.1.9" + xxhash-rust = { version = "0.8.6", features = ["xxh3"] } polars-core = { version = "0.33.2", path = "crates/polars-core", default-features = false } polars-arrow = { version = "0.33.2", path = "crates/polars-arrow", default-features = false } @@ -69,11 +75,9 @@ polars-json = { version = "0.33.2", path = "crates/polars-json", default-feature polars = { version = "0.33.2", path = "crates/polars", default-features = false } [workspace.dependencies.arrow] -package = "arrow2" -# git = "https://github.com/jorgecarleitao/arrow2" -# rev = "7c93e358fc400bf3c0c0219c22eefc6b38fc2d12" -# branch = "" -version = "0.18.0" +package = "nano-arrow" +version = "0.1.0" +path = "crates/nano-arrow" default-features = false features = [ "compute_aggregate", diff --git a/crates/Makefile b/crates/Makefile index e8271c7ed583..e0e187fc7d21 100644 --- a/crates/Makefile +++ b/crates/Makefile @@ -10,11 +10,11 @@ fmt: ## Run rustfmt and dprint .PHONY: check check: ## Run cargo check with all features - cargo check --workspace --all-targets --all-features + cargo check --workspace --all-targets --exclude nano-arrow --all-features .PHONY: clippy clippy: ## Run clippy with all features - cargo clippy --workspace --all-targets --all-features + cargo clippy --workspace --all-targets --exclude nano-arrow --all-features .PHONY: clippy-default clippy-default: ## Run clippy with default features diff --git a/crates/nano-arrow/Cargo.toml b/crates/nano-arrow/Cargo.toml new file mode 100644 index 000000000000..29b852d34572 --- /dev/null +++ b/crates/nano-arrow/Cargo.toml @@ -0,0 +1,198 @@ +[package] +name = "nano-arrow" +version = "0.1.0" +authors = ["Jorge C. Leitao ", "Apache Arrow ", "Ritchie Vink"] +edition.workspace = true +homepage.workspace = true +license = "MIT AND Apache-2.0" +repository.workspace = true +description = "Minimal implementation of the Arrow specification forked from arrow2."
+ +# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html + +[dependencies] +bytemuck.workspace = true +chrono.workspace = true +# for timezone support +chrono-tz = { workspace = true, optional = true } +dyn-clone = "1" +either.workspace = true +foreign_vec = "0.1.0" +hashbrown.workspace = true +num-traits.workspace = true +simdutf8.workspace = true + +# for decimal i256 +ethnum = "1" + +# To efficiently cast numbers to strings +lexical-core = { version = "0.8", optional = true } + +fallible-streaming-iterator = { workspace = true, optional = true } +regex = { workspace = true, optional = true } +regex-syntax = { version = "0.7", optional = true } +streaming-iterator = { workspace = true } + +indexmap = { workspace = true, optional = true } + +arrow-format = { version = "0.8", optional = true, features = ["ipc"] } + +hex = { workspace = true, optional = true } + +# for IPC compression +lz4 = { version = "1.24", optional = true } +zstd = { version = "0.12", optional = true } + +base64 = { workspace = true, optional = true } + +# to write to parquet as a stream +futures = { version = "0.3", optional = true } + +# to read IPC as a stream +async-stream = { version = "0.3.2", optional = true } + +# avro support +avro-schema = { version = "0.3", optional = true } + +# for division/remainder optimization at runtime +strength_reduce = { version = "0.2", optional = true } + +# For instruction multiversioning +multiversion = { workspace = true, optional = true } + +# Faster hashing +ahash.workspace = true + +# Support conversion to/from arrow-rs +arrow-array = { version = ">=40", optional = true } +arrow-buffer = { version = ">=40", optional = true } +arrow-data = { version = ">=40", optional = true } +arrow-schema = { version = ">=40", optional = true } + +[target.wasm32-unknown-unknown.dependencies] +getrandom = { version = "0.2", features = ["js"] } + +# parquet support +[dependencies.parquet2] +version = "0.17" +optional = true +default_features = false +features = ["async"] + +[dev-dependencies] +avro-rs = { version = "0.13", features = ["snappy"] } +criterion = "0.4" +crossbeam-channel = "0.5.1" +doc-comment = "0.3" +flate2 = "1" +# used to run formal property testing +proptest = { version = "1", default_features = false, features = ["std"] } +# use for flaky testing +rand = "0.8" +# use for generating and testing random data samples +sample-arrow2 = "0.1" +sample-std = "0.1" +sample-test = "0.1" +# used to test async readers +tokio = { version = "1", features = ["macros", "rt", "fs", "io-util"] } +tokio-util = { version = "0.7", features = ["compat"] } + +[package.metadata.docs.rs] +features = ["full"] +rustdoc-args = ["--cfg", "docsrs"] + +[features] +default = [] +full = [ + "arrow", + "io_ipc", + "io_flight", + "io_ipc_write_async", + "io_ipc_read_async", + "io_ipc_compression", + "io_parquet", + "io_parquet_compression", + "io_avro", + "io_avro_compression", + "io_avro_async", + "regex-syntax", + "compute", + # parses timezones used in timestamp conversions + "chrono-tz", +] +arrow = ["arrow-buffer", "arrow-schema", "arrow-data", "arrow-array"] +io_ipc = ["arrow-format"] +io_ipc_write_async = ["io_ipc", "futures"] +io_ipc_read_async = ["io_ipc", "futures", "async-stream"] +io_ipc_compression = ["lz4", "zstd"] +io_flight = ["io_ipc", "arrow-format/flight-data"] + +# base64 + io_ipc because arrow schemas are stored as base64-encoded ipc format. 
+io_parquet = ["parquet2", "io_ipc", "base64", "futures", "fallible-streaming-iterator"] + +io_parquet_compression = [ + "io_parquet_zstd", + "io_parquet_gzip", + "io_parquet_snappy", + "io_parquet_lz4", + "io_parquet_brotli", +] + +# sample testing of generated arrow data +io_parquet_sample_test = ["io_parquet"] + +# compression backends +io_parquet_zstd = ["parquet2/zstd"] +io_parquet_snappy = ["parquet2/snappy"] +io_parquet_gzip = ["parquet2/gzip"] +io_parquet_lz4_flex = ["parquet2/lz4_flex"] +io_parquet_lz4 = ["parquet2/lz4"] +io_parquet_brotli = ["parquet2/brotli"] + +# parquet bloom filter functions +io_parquet_bloom_filter = ["parquet2/bloom_filter"] + +io_avro = ["avro-schema"] +io_avro_compression = [ + "avro-schema/compression", +] +io_avro_async = ["avro-schema/async"] + +# the compute kernels. Disabling this significantly reduces compile time. +compute_aggregate = ["multiversion"] +compute_arithmetics_decimal = ["strength_reduce"] +compute_arithmetics = ["strength_reduce", "compute_arithmetics_decimal"] +compute_bitwise = [] +compute_boolean = [] +compute_boolean_kleene = [] +compute_cast = ["lexical-core", "compute_take"] +compute_comparison = ["compute_take", "compute_boolean"] +compute_concatenate = [] +compute_filter = [] +compute_hash = ["multiversion"] +compute_if_then_else = [] +compute_take = [] +compute_temporal = [] +compute = [ + "compute_aggregate", + "compute_arithmetics", + "compute_bitwise", + "compute_boolean", + "compute_boolean_kleene", + "compute_cast", + "compute_comparison", + "compute_concatenate", + "compute_filter", + "compute_hash", + "compute_if_then_else", + "compute_take", + "compute_temporal", +] +simd = [] + +[build-dependencies] +rustc_version = "0.4.0" + +[package.metadata.cargo-all-features] +allowlist = ["compute", "compute_sort", "compute_hash", "compute_nullif"] diff --git a/crates/nano-arrow/src/README.md b/crates/nano-arrow/src/README.md new file mode 100644 index 000000000000..d6371ebc8741 --- /dev/null +++ b/crates/nano-arrow/src/README.md @@ -0,0 +1,32 @@ +# Crate's design + +This document describes the design of this module, and thus the overall crate. +Each module MAY have its own design document covering the specifics of that module; if it does, +it MUST be in that module's `README.md`. + +## Equality + +Array equality is not defined in the Arrow specification. This crate follows the intent of the specification, but there is no guarantee that it equals e.g. C++'s definition. + +There is a single source of truth about whether two arrays are equal, and that is via their +equality operators, defined in the module [`array/equal`](array/equal/mod.rs). + +Implementations MUST use these operators when asserting equality, so that all testing follows the same definition of array equality. + +## Error handling + +- Errors from an external dependency MUST be encapsulated in `External`. +- Errors from IO MUST be encapsulated in `Io`. +- This crate MAY return `NotYetImplemented` when the functionality does not exist, or it MAY panic with `unimplemented!`. + +## Logical and physical types + +There is a strict separation between physical and logical types: + +- physical types MUST be implemented via generics +- logical types MUST be implemented via variables (whose value is e.g. an `enum`) +- logical types MUST be declared and implemented in the `datatypes` module + +## Source of undefined behavior + +There is one, and only one, acceptable source of undefined behavior: FFI. It is impossible to prove that data passed via pointers is safe for consumption (only a promise from the specification).
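To make the logical/physical separation described above concrete, here is a minimal sketch written as if it were in-crate code. It assumes the arrow2-era API this crate was forked from (`PrimitiveArray::from_vec`, `PrimitiveArray::to`, `DataType::Timestamp`) is unchanged; treat it as an illustration, not as documented API.

```rust
// Sketch only: assumes the arrow2-era constructors are unchanged in this fork.
use crate::array::PrimitiveArray;
use crate::datatypes::{DataType, TimeUnit};

fn logical_vs_physical() {
    // Physical type: the generic parameter `i64` decides the in-memory layout.
    let physical = PrimitiveArray::<i64>::from_vec(vec![1_600_000_000_000, 1_600_000_001_000]);
    // Logical type: a runtime `DataType` value reinterprets the same buffer.
    let logical = physical.to(DataType::Timestamp(TimeUnit::Millisecond, None));
    assert_eq!(logical.data_type(), &DataType::Timestamp(TimeUnit::Millisecond, None));
}
```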
diff --git a/crates/nano-arrow/src/array/README.md b/crates/nano-arrow/src/array/README.md new file mode 100644 index 000000000000..af21f91e02ef --- /dev/null +++ b/crates/nano-arrow/src/array/README.md @@ -0,0 +1,73 @@ +# Array module + +This document describes the overall design of this module. + +## Notation: + +- "array" in this module denotes any struct that implements the trait `Array`. +- "mutable array" in this module denotes any struct that implements the trait `MutableArray`. +- words in `code` denote existing terms in this implementation. + +## Arrays: + +- Every Arrow array with a different physical representation MUST be implemented as a struct or generic struct. + +- An array MAY have its own module. E.g. `primitive/mod.rs` + +- An array with a null bitmap MUST implement it as `Option<Bitmap>` + +- An array MUST be `#[derive(Clone)]` + +- The trait `Array` MUST only be implemented by structs in this module. + +- Every child array on the struct MUST be `Box<dyn Array>`. + +- An array MUST implement `try_new(...) -> Result<Self>`. This method MUST error iff + the data does not follow the arrow specification, including any sentinel types such as utf8. + +- An array MAY implement `unsafe try_new_unchecked` that skips validation steps that are `O(N)`. + +- An array MUST implement either `new_empty()` or `new_empty(DataType)` that returns a zero-length `Self`. + +- An array MUST implement either `new_null(length: usize)` or `new_null(DataType, length: usize)` that returns a valid array of length `length` all of whose elements are null. + +- An array MAY implement `value(i: usize)` that returns the value at slot `i` ignoring the validity bitmap. + +- Functions to create new arrays from native Rust SHOULD be named as follows: + - `from`: from a slice of optional values (e.g. `AsRef<[Option<bool>]>` for `BooleanArray`) + - `from_slice`: from a slice of values (e.g. `AsRef<[bool]>` for `BooleanArray`) + - `from_trusted_len_iter`: from an iterator of trusted len of optional values + - `from_trusted_len_values_iter`: from an iterator of trusted len of values + - `try_from_trusted_len_iter`: from a fallible iterator of trusted len of optional values + +### Slot offsets + +- An array MUST have an `offset: usize` measuring the number of slots that the array is currently offset by, if the specification requires it. + +- An array MUST implement `fn slice(&mut self, offset: usize, length: usize)` that offsets and/or truncates the array in place. This function MUST increase the array's offset if it exists. + +- Conversely, `offset` MUST only be changed by `slice`. + +The rationale for the above is that it enables us to be fully interoperable with the offset logic supported by the C data interface, while at the same time easily performing array slices +within Rust's type safety mechanism. + +### Mutable Arrays + +- An array MAY have a mutable counterpart. E.g. `MutablePrimitiveArray<T>` is the mutable counterpart of `PrimitiveArray<T>`. + +- Arrays with mutable counterparts MUST have their own module, and have the mutable counterpart declared in `{module}/mutable.rs`. + +- The trait `MutableArray` MUST only be implemented by mutable arrays in this module. + +- A mutable array MUST be `#[derive(Debug)]` + +- A mutable array with a null bitmap MUST implement it as `Option<MutableBitmap>` + +- Converting a `MutableArray` to its immutable counterpart MUST be `O(1)`. Specifically: + - it must not allocate + - it must not cause `O(N)` data transformations + + This is achieved by converting mutable versions to immutable counterparts (e.g. `MutableBitmap -> Bitmap`). + + The rationale is that `MutableArray`s can be used to perform in-place operations under + the arrow spec.
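The constructor-naming and slicing conventions above can be illustrated with a small sketch using the `BinaryArray` added later in this PR. The names follow the arrow2-era API and are assumed unchanged in this fork; this is an illustration, not a test from the crate.

```rust
// Sketch of the naming and slicing conventions; assumes the arrow2-era API.
use crate::array::BinaryArray;

fn conventions() {
    // `from`: slice of optional values; `from_slice`: slice of (non-null) values.
    let nullable = BinaryArray::<i32>::from([Some(b"a".as_ref()), None, Some(b"bc".as_ref())]);
    let dense = BinaryArray::<i32>::from_slice([b"a".as_ref(), b"bc".as_ref()]);
    assert_eq!(nullable.len(), 3);
    assert_eq!(dense.len(), 2);

    // `slice` is O(1): it only adjusts offset/length; the underlying buffers stay shared.
    let mut view = nullable.clone();
    view.slice(1, 2);
    assert_eq!(view.len(), 2);
}
```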
diff --git a/crates/nano-arrow/src/array/binary/data.rs b/crates/nano-arrow/src/array/binary/data.rs new file mode 100644 index 000000000000..56835dec0c42 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/data.rs @@ -0,0 +1,43 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{Arrow2Arrow, BinaryArray}; +use crate::bitmap::Bitmap; +use crate::offset::{Offset, OffsetsBuffer}; + +impl<O: Offset> Arrow2Arrow for BinaryArray<O> { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + let builder = ArrayDataBuilder::new(data_type) + .len(self.offsets().len_proxy()) + .buffers(vec![ + self.offsets.clone().into_inner().into(), + self.values.clone().into(), + ]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + + if data.is_empty() { + // Handle empty offsets + return Self::new_empty(data_type); + } + + let buffers = data.buffers(); + + // Safety: ArrayData is valid + let mut offsets = unsafe { OffsetsBuffer::new_unchecked(buffers[0].clone().into()) }; + offsets.slice(data.offset(), data.len() + 1); + + Self { + data_type, + offsets, + values: buffers[1].clone().into(), + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/binary/ffi.rs b/crates/nano-arrow/src/array/binary/ffi.rs new file mode 100644 index 000000000000..3ba66cc130da --- /dev/null +++ b/crates/nano-arrow/src/array/binary/ffi.rs @@ -0,0 +1,63 @@ +use super::BinaryArray; +use crate::array::{FromFfi, ToFfi}; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; +use crate::offset::{Offset, OffsetsBuffer}; + +unsafe impl<O: Offset> ToFfi for BinaryArray<O> { + fn buffers(&self) -> Vec<Option<*const u8>> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.offsets.buffer().as_ptr().cast::<u8>()), + Some(self.values.as_ptr().cast::<u8>()), + ] + } + + fn offset(&self) -> Option<usize> { + let offset = self.offsets.buffer().offset(); + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.offsets.buffer().offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + offsets: self.offsets.clone(), + values: self.values.clone(), + } + } +} + +impl<O: Offset, A: ffi::ArrowArrayRef> FromFfi<A> for BinaryArray<O> { + unsafe fn try_from_ffi(array: A) -> Result<Self> { + let data_type = array.data_type().clone(); + + let validity = unsafe { array.validity() }?; + let offsets = unsafe { array.buffer::<O>(1) }?; + let values = unsafe { array.buffer::<u8>(2) }?; + + // assumption that data from FFI is well constructed + let offsets = unsafe { OffsetsBuffer::new_unchecked(offsets) }; + + Ok(Self::new(data_type, offsets, values, validity)) + } +} diff --git a/crates/nano-arrow/src/array/binary/fmt.rs b/crates/nano-arrow/src/array/binary/fmt.rs new file mode 100644 index 000000000000..d2a6788ce4d8 --- /dev/null +++
b/crates/nano-arrow/src/array/binary/fmt.rs @@ -0,0 +1,26 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::write_vec; +use super::BinaryArray; +use crate::offset::Offset; + +pub fn write_value(array: &BinaryArray, index: usize, f: &mut W) -> Result { + let bytes = array.value(index); + let writer = |f: &mut W, index| write!(f, "{}", bytes[index]); + + write_vec(f, writer, None, bytes.len(), "None", false) +} + +impl Debug for BinaryArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, f); + + let head = if O::IS_LARGE { + "LargeBinaryArray" + } else { + "BinaryArray" + }; + write!(f, "{head}")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/binary/from.rs b/crates/nano-arrow/src/array/binary/from.rs new file mode 100644 index 000000000000..73df03531594 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/from.rs @@ -0,0 +1,11 @@ +use std::iter::FromIterator; + +use super::{BinaryArray, MutableBinaryArray}; +use crate::offset::Offset; + +impl> FromIterator> for BinaryArray { + #[inline] + fn from_iter>>(iter: I) -> Self { + MutableBinaryArray::::from_iter(iter).into() + } +} diff --git a/crates/nano-arrow/src/array/binary/iterator.rs b/crates/nano-arrow/src/array/binary/iterator.rs new file mode 100644 index 000000000000..3fccec58eb50 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/iterator.rs @@ -0,0 +1,42 @@ +use super::{BinaryArray, MutableBinaryValuesArray}; +use crate::array::{ArrayAccessor, ArrayValuesIter}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::offset::Offset; + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for BinaryArray { + type Item = &'a [u8]; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +/// Iterator of values of an [`BinaryArray`]. +pub type BinaryValueIter<'a, O> = ArrayValuesIter<'a, BinaryArray>; + +impl<'a, O: Offset> IntoIterator for &'a BinaryArray { + type Item = Option<&'a [u8]>; + type IntoIter = ZipValidity<&'a [u8], BinaryValueIter<'a, O>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +/// Iterator of values of an [`MutableBinaryValuesArray`]. 
+pub type MutableBinaryValuesIter<'a, O> = ArrayValuesIter<'a, MutableBinaryValuesArray>; + +impl<'a, O: Offset> IntoIterator for &'a MutableBinaryValuesArray { + type Item = &'a [u8]; + type IntoIter = MutableBinaryValuesIter<'a, O>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} diff --git a/crates/nano-arrow/src/array/binary/mod.rs b/crates/nano-arrow/src/array/binary/mod.rs new file mode 100644 index 000000000000..ccd58f22d869 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/mod.rs @@ -0,0 +1,423 @@ +use either::Either; + +use super::specification::try_check_offsets_bounds; +use super::{Array, GenericBinaryArray}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::Error; +use crate::offset::{Offset, Offsets, OffsetsBuffer}; +use crate::trusted_len::TrustedLen; + +mod ffi; +pub(super) mod fmt; +mod iterator; +pub use iterator::*; +mod from; +mod mutable_values; +pub use mutable_values::*; +mod mutable; +pub use mutable::*; + +#[cfg(feature = "arrow")] +mod data; + +/// A [`BinaryArray`] is Arrow's semantically equivalent of an immutable `Vec>>`. +/// It implements [`Array`]. +/// +/// The size of this struct is `O(1)`, as all data is stored behind an [`std::sync::Arc`]. +/// # Example +/// ``` +/// use arrow2::array::BinaryArray; +/// use arrow2::bitmap::Bitmap; +/// use arrow2::buffer::Buffer; +/// +/// let array = BinaryArray::::from([Some([1, 2].as_ref()), None, Some([3].as_ref())]); +/// assert_eq!(array.value(0), &[1, 2]); +/// assert_eq!(array.iter().collect::>(), vec![Some([1, 2].as_ref()), None, Some([3].as_ref())]); +/// assert_eq!(array.values_iter().collect::>(), vec![[1, 2].as_ref(), &[], &[3]]); +/// // the underlying representation: +/// assert_eq!(array.values(), &Buffer::from(vec![1, 2, 3])); +/// assert_eq!(array.offsets().buffer(), &Buffer::from(vec![0, 2, 2, 3])); +/// assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true]))); +/// ``` +/// +/// # Generic parameter +/// The generic parameter [`Offset`] can only be `i32` or `i64` and tradeoffs maximum array length with +/// memory usage: +/// * the sum of lengths of all elements cannot exceed `Offset::MAX` +/// * the total size of the underlying data is `array.len() * size_of::() + sum of lengths of all elements` +/// +/// # Safety +/// The following invariants hold: +/// * Two consecutives `offsets` casted (`as`) to `usize` are valid slices of `values`. +/// * `len` is equal to `validity.len()`, when defined. +#[derive(Clone)] +pub struct BinaryArray { + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, +} + +impl BinaryArray { + /// Returns a [`BinaryArray`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Binary` or `LargeBinary`. 
+ /// # Implementation + /// This function is `O(1)` + pub fn try_new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Result { + try_check_offsets_bounds(&offsets, values.len())?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != offsets.len_proxy()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + return Err(Error::oos( + "BinaryArray can only be initialized with DataType::Binary or DataType::LargeBinary", + )); + } + + Ok(Self { + data_type, + offsets, + values, + validity, + }) + } + + /// Creates a new [`BinaryArray`] from slices of `&[u8]`. + pub fn from_slice, P: AsRef<[T]>>(slice: P) -> Self { + Self::from_trusted_len_values_iter(slice.as_ref().iter()) + } + + /// Creates a new [`BinaryArray`] from a slice of optional `&[u8]`. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. + pub fn from, P: AsRef<[Option]>>(slice: P) -> Self { + MutableBinaryArray::::from(slice).into() + } + + /// Returns an iterator of `Option<&[u8]>` over every element of this array. + pub fn iter(&self) -> ZipValidity<&[u8], BinaryValueIter, BitmapIter> { + ZipValidity::new_with_validity(self.values_iter(), self.validity.as_ref()) + } + + /// Returns an iterator of `&[u8]` over every element of this array, ignoring the validity + pub fn values_iter(&self) -> BinaryValueIter { + BinaryValueIter::new(self) + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// Returns the element at index `i` + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn value(&self, i: usize) -> &[u8] { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the element at index `i` + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &[u8] { + // soundness: the invariant of the function + let (start, end) = self.offsets.start_end_unchecked(i); + + // soundness: the invariant of the struct + self.values.get_unchecked(start..end) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option<&[u8]> { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } + + /// Returns the [`DataType`] of this array. + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } + + /// Returns the values of this [`BinaryArray`]. + #[inline] + pub fn values(&self) -> &Buffer { + &self.values + } + + /// Returns the offsets of this [`BinaryArray`]. + #[inline] + pub fn offsets(&self) -> &OffsetsBuffer { + &self.offsets + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Slices this [`BinaryArray`]. + /// # Implementation + /// This function is `O(1)`. + /// # Panics + /// iff `offset + length > self.len()`. + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`BinaryArray`]. + /// # Implementation + /// This function is `O(1)`. 
+ /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.offsets.slice_unchecked(offset, length + 1); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (DataType, OffsetsBuffer, Buffer, Option) { + let Self { + data_type, + offsets, + values, + validity, + } = self; + (data_type, offsets, values, validity) + } + + /// Try to convert this `BinaryArray` to a `MutableBinaryArray` + #[must_use] + pub fn into_mut(self) -> Either> { + use Either::*; + if let Some(bitmap) = self.validity { + match bitmap.into_mut() { + // Safety: invariants are preserved + Left(bitmap) => Left(BinaryArray::new( + self.data_type, + self.offsets, + self.values, + Some(bitmap), + )), + Right(mutable_bitmap) => match (self.values.into_mut(), self.offsets.into_mut()) { + (Left(values), Left(offsets)) => Left(BinaryArray::new( + self.data_type, + offsets, + values, + Some(mutable_bitmap.into()), + )), + (Left(values), Right(offsets)) => Left(BinaryArray::new( + self.data_type, + offsets.into(), + values, + Some(mutable_bitmap.into()), + )), + (Right(values), Left(offsets)) => Left(BinaryArray::new( + self.data_type, + offsets, + values.into(), + Some(mutable_bitmap.into()), + )), + (Right(values), Right(offsets)) => Right( + MutableBinaryArray::try_new( + self.data_type, + offsets, + values, + Some(mutable_bitmap), + ) + .unwrap(), + ), + }, + } + } else { + match (self.values.into_mut(), self.offsets.into_mut()) { + (Left(values), Left(offsets)) => { + Left(BinaryArray::new(self.data_type, offsets, values, None)) + }, + (Left(values), Right(offsets)) => Left(BinaryArray::new( + self.data_type, + offsets.into(), + values, + None, + )), + (Right(values), Left(offsets)) => Left(BinaryArray::new( + self.data_type, + offsets, + values.into(), + None, + )), + (Right(values), Right(offsets)) => Right( + MutableBinaryArray::try_new(self.data_type, offsets, values, None).unwrap(), + ), + } + } + } + + /// Creates an empty [`BinaryArray`], i.e. whose `.len` is zero. + pub fn new_empty(data_type: DataType) -> Self { + Self::new(data_type, OffsetsBuffer::new(), Buffer::new(), None) + } + + /// Creates an null [`BinaryArray`], i.e. whose `.null_count() == .len()`. + #[inline] + pub fn new_null(data_type: DataType, length: usize) -> Self { + Self::new( + data_type, + Offsets::new_zeroed(length).into(), + Buffer::new(), + Some(Bitmap::new_zeroed(length)), + ) + } + + /// Returns the default [`DataType`], `DataType::Binary` or `DataType::LargeBinary` + pub fn default_data_type() -> DataType { + if O::IS_LARGE { + DataType::LargeBinary + } else { + DataType::Binary + } + } + + /// Alias for unwrapping [`Self::try_new`] + pub fn new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Self { + Self::try_new(data_type, offsets, values, validity).unwrap() + } + + /// Returns a [`BinaryArray`] from an iterator of trusted length. + /// + /// The [`BinaryArray`] is guaranteed to not have a validity + #[inline] + pub fn from_trusted_len_values_iter, I: TrustedLen>( + iterator: I, + ) -> Self { + MutableBinaryArray::::from_trusted_len_values_iter(iterator).into() + } + + /// Returns a new [`BinaryArray`] from a [`Iterator`] of `&[u8]`. 
+ /// + /// The [`BinaryArray`] is guaranteed to not have a validity + pub fn from_iter_values, I: Iterator>(iterator: I) -> Self { + MutableBinaryArray::::from_iter_values(iterator).into() + } + + /// Creates a [`BinaryArray`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: Iterator>, + { + MutableBinaryArray::::from_trusted_len_iter_unchecked(iterator).into() + } + + /// Creates a [`BinaryArray`] from a [`TrustedLen`] + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: TrustedLen>, + { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a [`BinaryArray`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked(iterator: I) -> Result + where + P: AsRef<[u8]>, + I: IntoIterator, E>>, + { + MutableBinaryArray::::try_from_trusted_len_iter_unchecked(iterator).map(|x| x.into()) + } + + /// Creates a [`BinaryArray`] from an fallible iterator of trusted length. + #[inline] + pub fn try_from_trusted_len_iter(iter: I) -> Result + where + P: AsRef<[u8]>, + I: TrustedLen, E>>, + { + // soundness: I: TrustedLen + unsafe { Self::try_from_trusted_len_iter_unchecked(iter) } + } +} + +impl Array for BinaryArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} + +unsafe impl GenericBinaryArray for BinaryArray { + #[inline] + fn values(&self) -> &[u8] { + self.values() + } + + #[inline] + fn offsets(&self) -> &[O] { + self.offsets().buffer() + } +} diff --git a/crates/nano-arrow/src/array/binary/mutable.rs b/crates/nano-arrow/src/array/binary/mutable.rs new file mode 100644 index 000000000000..92521b400323 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/mutable.rs @@ -0,0 +1,469 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::{BinaryArray, MutableBinaryValuesArray, MutableBinaryValuesIter}; +use crate::array::physical_binary::*; +use crate::array::{Array, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; +use crate::trusted_len::TrustedLen; + +/// The Arrow's equivalent to `Vec>>`. +/// Converting a [`MutableBinaryArray`] into a [`BinaryArray`] is `O(1)`. +/// # Implementation +/// This struct does not allocate a validity until one is required (i.e. push a null to it). 
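The doc comment above promises an `O(1)` conversion and lazy validity allocation; a minimal usage sketch (written as in-crate code, assuming the arrow2-era method names shown in this file) looks like this:

```rust
// Sketch: build incrementally, then freeze in O(1); assumes the arrow2-era API.
use crate::array::{BinaryArray, MutableBinaryArray};

fn build() -> BinaryArray<i32> {
    let mut array = MutableBinaryArray::<i32>::new();
    array.push(Some(b"hello".as_ref()));
    array.push::<&[u8]>(None); // first null: the validity bitmap is allocated only now
    array.push(Some(b"world".as_ref()));
    array.into() // O(1): buffers are moved, not copied
}
```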
+#[derive(Debug, Clone)] +pub struct MutableBinaryArray { + values: MutableBinaryValuesArray, + validity: Option, +} + +impl From> for BinaryArray { + fn from(other: MutableBinaryArray) -> Self { + let validity = other.validity.and_then(|x| { + let validity: Option = x.into(); + validity + }); + let array: BinaryArray = other.values.into(); + array.with_validity(validity) + } +} + +impl Default for MutableBinaryArray { + fn default() -> Self { + Self::new() + } +} + +impl MutableBinaryArray { + /// Creates a new empty [`MutableBinaryArray`]. + /// # Implementation + /// This allocates a [`Vec`] of one element + pub fn new() -> Self { + Self::with_capacity(0) + } + + /// Returns a [`MutableBinaryArray`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Binary` or `LargeBinary`. + /// # Implementation + /// This function is `O(1)` + pub fn try_new( + data_type: DataType, + offsets: Offsets, + values: Vec, + validity: Option, + ) -> Result { + let values = MutableBinaryValuesArray::try_new(data_type, offsets, values)?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != values.len()) + { + return Err(Error::oos( + "validity's length must be equal to the number of values", + )); + } + + Ok(Self { values, validity }) + } + + /// Creates a new [`MutableBinaryArray`] from a slice of optional `&[u8]`. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. + pub fn from, P: AsRef<[Option]>>(slice: P) -> Self { + Self::from_trusted_len_iter(slice.as_ref().iter().map(|x| x.as_ref())) + } + + fn default_data_type() -> DataType { + BinaryArray::::default_data_type() + } + + /// Initializes a new [`MutableBinaryArray`] with a pre-allocated capacity of slots. + pub fn with_capacity(capacity: usize) -> Self { + Self::with_capacities(capacity, 0) + } + + /// Initializes a new [`MutableBinaryArray`] with a pre-allocated capacity of slots and values. + /// # Implementation + /// This does not allocate the validity. + pub fn with_capacities(capacity: usize, values: usize) -> Self { + Self { + values: MutableBinaryValuesArray::with_capacities(capacity, values), + validity: None, + } + } + + /// Reserves `additional` elements and `additional_values` on the values buffer. + pub fn reserve(&mut self, additional: usize, additional_values: usize) { + self.values.reserve(additional, additional_values); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Pushes a new element to the array. + /// # Panic + /// This operation panics iff the length of all values (in bytes) exceeds `O` maximum value. + pub fn push>(&mut self, value: Option) { + self.try_push(value).unwrap() + } + + /// Pop the last entry from [`MutableBinaryArray`]. + /// This function returns `None` iff this array is empty + pub fn pop(&mut self) -> Option> { + let value = self.values.pop()?; + self.validity + .as_mut() + .map(|x| x.pop()?.then(|| ())) + .unwrap_or_else(|| Some(())) + .map(|_| value) + } + + fn try_from_iter, I: IntoIterator>>(iter: I) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut primitive = Self::with_capacity(lower); + for item in iterator { + primitive.try_push(item.as_ref())? 
+ } + Ok(primitive) + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + validity.extend_constant(self.len(), true); + validity.set(self.len() - 1, false); + self.validity = Some(validity); + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: BinaryArray = self.into(); + Arc::new(a) + } + + /// Shrinks the capacity of the [`MutableBinaryArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } + + impl_mutable_array_mut_validity!(); +} + +impl MutableBinaryArray { + /// returns its values. + pub fn values(&self) -> &Vec { + self.values.values() + } + + /// returns its offsets. + pub fn offsets(&self) -> &Offsets { + self.values.offsets() + } + + /// Returns an iterator of `Option<&[u8]>` + pub fn iter(&self) -> ZipValidity<&[u8], MutableBinaryValuesIter, BitmapIter> { + ZipValidity::new(self.values_iter(), self.validity.as_ref().map(|x| x.iter())) + } + + /// Returns an iterator over the values of this array + pub fn values_iter(&self) -> MutableBinaryValuesIter { + self.values.iter() + } +} + +impl MutableArray for MutableBinaryArray { + fn len(&self) -> usize { + self.values.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + let array: BinaryArray = std::mem::take(self).into(); + array.boxed() + } + + fn as_arc(&mut self) -> Arc { + let array: BinaryArray = std::mem::take(self).into(); + array.arced() + } + + fn data_type(&self) -> &DataType { + self.values.data_type() + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push::<&[u8]>(None) + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional, 0) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl> FromIterator> for MutableBinaryArray { + fn from_iter>>(iter: I) -> Self { + Self::try_from_iter(iter).unwrap() + } +} + +impl MutableBinaryArray { + /// Creates a [`MutableBinaryArray`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: Iterator>, + { + let (validity, offsets, values) = trusted_len_unzip(iterator); + + Self::try_new(Self::default_data_type(), offsets, values, validity).unwrap() + } + + /// Creates a [`MutableBinaryArray`] from an iterator of trusted length. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: TrustedLen>, + { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a new [`BinaryArray`] from a [`TrustedLen`] of `&[u8]`. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. 
+ #[inline] + pub unsafe fn from_trusted_len_values_iter_unchecked, I: Iterator>( + iterator: I, + ) -> Self { + let (offsets, values) = trusted_len_values_iter(iterator); + Self::try_new(Self::default_data_type(), offsets, values, None).unwrap() + } + + /// Creates a new [`BinaryArray`] from a [`TrustedLen`] of `&[u8]`. + #[inline] + pub fn from_trusted_len_values_iter, I: TrustedLen>( + iterator: I, + ) -> Self { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_values_iter_unchecked(iterator) } + } + + /// Creates a [`MutableBinaryArray`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked( + iterator: I, + ) -> std::result::Result + where + P: AsRef<[u8]>, + I: IntoIterator, E>>, + { + let iterator = iterator.into_iter(); + + // soundness: assumed trusted len + let (mut validity, offsets, values) = try_trusted_len_unzip(iterator)?; + + if validity.as_mut().unwrap().unset_bits() == 0 { + validity = None; + } + + Ok(Self::try_new(Self::default_data_type(), offsets, values, validity).unwrap()) + } + + /// Creates a [`MutableBinaryArray`] from an falible iterator of trusted length. + #[inline] + pub fn try_from_trusted_len_iter(iterator: I) -> std::result::Result + where + P: AsRef<[u8]>, + I: TrustedLen, E>>, + { + // soundness: I: TrustedLen + unsafe { Self::try_from_trusted_len_iter_unchecked(iterator) } + } + + /// Extends the [`MutableBinaryArray`] from an iterator of trusted length. + /// This differs from `extend_trusted_len` which accepts iterator of optional values. + #[inline] + pub fn extend_trusted_len_values(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: TrustedLen, + { + // Safety: The iterator is `TrustedLen` + unsafe { self.extend_trusted_len_values_unchecked(iterator) } + } + + /// Extends the [`MutableBinaryArray`] from an iterator of values. + /// This differs from `extended_trusted_len` which accepts iterator of optional values. + #[inline] + pub fn extend_values(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: Iterator, + { + let length = self.values.len(); + self.values.extend(iterator); + let additional = self.values.len() - length; + + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(additional, true); + } + } + + /// Extends the [`MutableBinaryArray`] from an `iterator` of values of trusted length. + /// This differs from `extend_trusted_len_unchecked` which accepts iterator of optional + /// values. 
+ /// # Safety + /// The `iterator` must be [`TrustedLen`] + #[inline] + pub unsafe fn extend_trusted_len_values_unchecked(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: Iterator, + { + let length = self.values.len(); + self.values.extend_trusted_len_unchecked(iterator); + let additional = self.values.len() - length; + + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(additional, true); + } + } + + /// Extends the [`MutableBinaryArray`] from an iterator of [`TrustedLen`] + #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: TrustedLen>, + { + // Safety: The iterator is `TrustedLen` + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends the [`MutableBinaryArray`] from an iterator of [`TrustedLen`] + /// # Safety + /// The `iterator` must be [`TrustedLen`] + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: Iterator>, + { + if self.validity.is_none() { + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + self.validity = Some(validity); + } + + self.values + .extend_from_trusted_len_iter(self.validity.as_mut().unwrap(), iterator); + } + + /// Creates a new [`MutableBinaryArray`] from a [`Iterator`] of `&[u8]`. + pub fn from_iter_values, I: Iterator>(iterator: I) -> Self { + let (offsets, values) = values_iter(iterator); + Self::try_new(Self::default_data_type(), offsets, values, None).unwrap() + } + + /// Extend with a fallible iterator + pub fn extend_fallible(&mut self, iter: I) -> std::result::Result<(), E> + where + E: std::error::Error, + I: IntoIterator, E>>, + T: AsRef<[u8]>, + { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| { + self.push(x?); + Ok(()) + }) + } +} + +impl> Extend> for MutableBinaryArray { + fn extend>>(&mut self, iter: I) { + self.try_extend(iter).unwrap(); + } +} + +impl> TryExtend> for MutableBinaryArray { + fn try_extend>>(&mut self, iter: I) -> Result<()> { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| self.try_push(x)) + } +} + +impl> TryPush> for MutableBinaryArray { + fn try_push(&mut self, value: Option) -> Result<()> { + match value { + Some(value) => { + self.values.try_push(value.as_ref())?; + + match &mut self.validity { + Some(validity) => validity.push(true), + None => {}, + } + }, + None => { + self.values.push(""); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + }, + } + Ok(()) + } +} + +impl PartialEq for MutableBinaryArray { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl TryExtendFromSelf for MutableBinaryArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + self.values.try_extend_from_self(&other.values) + } +} diff --git a/crates/nano-arrow/src/array/binary/mutable_values.rs b/crates/nano-arrow/src/array/binary/mutable_values.rs new file mode 100644 index 000000000000..e73f0223ec44 --- /dev/null +++ b/crates/nano-arrow/src/array/binary/mutable_values.rs @@ -0,0 +1,374 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::{BinaryArray, MutableBinaryArray}; +use crate::array::physical_binary::*; +use crate::array::specification::try_check_offsets_bounds; +use crate::array::{ + Array, ArrayAccessor, ArrayValuesIter, MutableArray, TryExtend, 
TryExtendFromSelf, TryPush, +}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; +use crate::trusted_len::TrustedLen; + +/// A [`MutableArray`] that builds a [`BinaryArray`]. It differs +/// from [`MutableBinaryArray`] in that it builds non-null [`BinaryArray`]. +#[derive(Debug, Clone)] +pub struct MutableBinaryValuesArray { + data_type: DataType, + offsets: Offsets, + values: Vec, +} + +impl From> for BinaryArray { + fn from(other: MutableBinaryValuesArray) -> Self { + BinaryArray::::new( + other.data_type, + other.offsets.into(), + other.values.into(), + None, + ) + } +} + +impl From> for MutableBinaryArray { + fn from(other: MutableBinaryValuesArray) -> Self { + MutableBinaryArray::::try_new(other.data_type, other.offsets, other.values, None) + .expect("MutableBinaryValuesArray is consistent with MutableBinaryArray") + } +} + +impl Default for MutableBinaryValuesArray { + fn default() -> Self { + Self::new() + } +} + +impl MutableBinaryValuesArray { + /// Returns an empty [`MutableBinaryValuesArray`]. + pub fn new() -> Self { + Self { + data_type: Self::default_data_type(), + offsets: Offsets::new(), + values: Vec::::new(), + } + } + + /// Returns a [`MutableBinaryValuesArray`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Binary` or `LargeBinary`. + /// # Implementation + /// This function is `O(1)` + pub fn try_new(data_type: DataType, offsets: Offsets, values: Vec) -> Result { + try_check_offsets_bounds(&offsets, values.len())?; + + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + return Err(Error::oos( + "MutableBinaryValuesArray can only be initialized with DataType::Binary or DataType::LargeBinary", + )); + } + + Ok(Self { + data_type, + offsets, + values, + }) + } + + /// Returns the default [`DataType`] of this container: [`DataType::Utf8`] or [`DataType::LargeUtf8`] + /// depending on the generic [`Offset`]. + pub fn default_data_type() -> DataType { + BinaryArray::::default_data_type() + } + + /// Initializes a new [`MutableBinaryValuesArray`] with a pre-allocated capacity of items. + pub fn with_capacity(capacity: usize) -> Self { + Self::with_capacities(capacity, 0) + } + + /// Initializes a new [`MutableBinaryValuesArray`] with a pre-allocated capacity of items and values. + pub fn with_capacities(capacity: usize, values: usize) -> Self { + Self { + data_type: Self::default_data_type(), + offsets: Offsets::::with_capacity(capacity), + values: Vec::::with_capacity(values), + } + } + + /// returns its values. + #[inline] + pub fn values(&self) -> &Vec { + &self.values + } + + /// returns its offsets. + #[inline] + pub fn offsets(&self) -> &Offsets { + &self.offsets + } + + /// Reserves `additional` elements and `additional_values` on the values. + #[inline] + pub fn reserve(&mut self, additional: usize, additional_values: usize) { + self.offsets.reserve(additional); + self.values.reserve(additional_values); + } + + /// Returns the capacity in number of items + pub fn capacity(&self) -> usize { + self.offsets.capacity() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// Pushes a new item to the array. 
+ /// # Panic + /// This operation panics iff the length of all values (in bytes) exceeds `O` maximum value. + #[inline] + pub fn push>(&mut self, value: T) { + self.try_push(value).unwrap() + } + + /// Pop the last entry from [`MutableBinaryValuesArray`]. + /// This function returns `None` iff this array is empty. + pub fn pop(&mut self) -> Option> { + if self.len() == 0 { + return None; + } + self.offsets.pop()?; + let start = self.offsets.last().to_usize(); + let value = self.values.split_off(start); + Some(value.to_vec()) + } + + /// Returns the value of the element at index `i`. + /// # Panic + /// This function panics iff `i >= self.len`. + #[inline] + pub fn value(&self, i: usize) -> &[u8] { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the value of the element at index `i`. + /// # Safety + /// This function is safe iff `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &[u8] { + // soundness: the invariant of the function + let (start, end) = self.offsets.start_end(i); + + // soundness: the invariant of the struct + self.values.get_unchecked(start..end) + } + + /// Returns an iterator of `&[u8]` + pub fn iter(&self) -> ArrayValuesIter { + ArrayValuesIter::new(self) + } + + /// Shrinks the capacity of the [`MutableBinaryValuesArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + self.offsets.shrink_to_fit(); + } + + /// Extract the low-end APIs from the [`MutableBinaryValuesArray`]. + pub fn into_inner(self) -> (DataType, Offsets, Vec) { + (self.data_type, self.offsets, self.values) + } +} + +impl MutableArray for MutableBinaryValuesArray { + fn len(&self) -> usize { + self.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + None + } + + fn as_box(&mut self) -> Box { + let (data_type, offsets, values) = std::mem::take(self).into_inner(); + BinaryArray::new(data_type, offsets.into(), values.into(), None).boxed() + } + + fn as_arc(&mut self) -> Arc { + let (data_type, offsets, values) = std::mem::take(self).into_inner(); + BinaryArray::new(data_type, offsets.into(), values.into(), None).arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push::<&[u8]>(b"") + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional, 0) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl> FromIterator
for MutableBinaryValuesArray { + fn from_iter>(iter: I) -> Self { + let (offsets, values) = values_iter(iter.into_iter()); + Self::try_new(Self::default_data_type(), offsets, values).unwrap() + } +} + +impl MutableBinaryValuesArray { + pub(crate) unsafe fn extend_from_trusted_len_iter( + &mut self, + validity: &mut MutableBitmap, + iterator: I, + ) where + P: AsRef<[u8]>, + I: Iterator>, + { + extend_from_trusted_len_iter(&mut self.offsets, &mut self.values, validity, iterator); + } + + /// Extends the [`MutableBinaryValuesArray`] from a [`TrustedLen`] + #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: TrustedLen, + { + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends [`MutableBinaryValuesArray`] from an iterator of trusted len. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: AsRef<[u8]>, + I: Iterator, + { + extend_from_trusted_len_values_iter(&mut self.offsets, &mut self.values, iterator); + } + + /// Creates a [`MutableBinaryValuesArray`] from a [`TrustedLen`] + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: TrustedLen, + { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Returns a new [`MutableBinaryValuesArray`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef<[u8]>, + I: Iterator, + { + let (offsets, values) = trusted_len_values_iter(iterator); + Self::try_new(Self::default_data_type(), offsets, values).unwrap() + } + + /// Returns a new [`MutableBinaryValuesArray`] from an iterator. + /// # Error + /// This operation errors iff the total length in bytes on the iterator exceeds `O`'s maximum value. + /// (`i32::MAX` or `i64::MAX` respectively). 
+ pub fn try_from_iter, I: IntoIterator>(iter: I) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut array = Self::with_capacity(lower); + for item in iterator { + array.try_push(item)?; + } + Ok(array) + } + + /// Extend with a fallible iterator + pub fn extend_fallible(&mut self, iter: I) -> std::result::Result<(), E> + where + E: std::error::Error, + I: IntoIterator>, + T: AsRef<[u8]>, + { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| { + self.push(x?); + Ok(()) + }) + } +} + +impl> Extend for MutableBinaryValuesArray { + fn extend>(&mut self, iter: I) { + extend_from_values_iter(&mut self.offsets, &mut self.values, iter.into_iter()); + } +} + +impl> TryExtend for MutableBinaryValuesArray { + fn try_extend>(&mut self, iter: I) -> Result<()> { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| self.try_push(x)) + } +} + +impl> TryPush for MutableBinaryValuesArray { + #[inline] + fn try_push(&mut self, value: T) -> Result<()> { + let bytes = value.as_ref(); + self.values.extend_from_slice(bytes); + self.offsets.try_push_usize(bytes.len()) + } +} + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for MutableBinaryValuesArray { + type Item = &'a [u8]; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +impl TryExtendFromSelf for MutableBinaryValuesArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + self.values.extend_from_slice(&other.values); + self.offsets.try_extend_from_self(&other.offsets) + } +} diff --git a/crates/nano-arrow/src/array/boolean/data.rs b/crates/nano-arrow/src/array/boolean/data.rs new file mode 100644 index 000000000000..e93aeb3b8d2b --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/data.rs @@ -0,0 +1,36 @@ +use arrow_buffer::{BooleanBuffer, NullBuffer}; +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{Arrow2Arrow, BooleanArray}; +use crate::bitmap::Bitmap; +use crate::datatypes::DataType; + +impl Arrow2Arrow for BooleanArray { + fn to_data(&self) -> ArrayData { + let buffer = NullBuffer::from(self.values.clone()); + + let builder = ArrayDataBuilder::new(arrow_schema::DataType::Boolean) + .len(buffer.len()) + .offset(buffer.offset()) + .buffers(vec![buffer.into_inner().into_inner()]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + assert_eq!(data.data_type(), &arrow_schema::DataType::Boolean); + + let buffers = data.buffers(); + let buffer = BooleanBuffer::new(buffers[0].clone(), data.offset(), data.len()); + // Use NullBuffer to compute set count + let values = Bitmap::from_null_buffer(NullBuffer::new(buffer)); + + Self { + data_type: DataType::Boolean, + values, + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/boolean/ffi.rs b/crates/nano-arrow/src/array/boolean/ffi.rs new file mode 100644 index 000000000000..64f22de81d5d --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/ffi.rs @@ -0,0 +1,54 @@ +use super::BooleanArray; +use crate::array::{FromFfi, ToFfi}; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; + +unsafe impl ToFfi for BooleanArray { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| 
x.as_ptr()), + Some(self.values.as_ptr()), + ] + } + + fn offset(&self) -> Option { + let offset = self.values.offset(); + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.values.offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + values: self.values.clone(), + } + } +} + +impl FromFfi for BooleanArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let values = unsafe { array.bitmap(1) }?; + Self::try_new(data_type, values, validity) + } +} diff --git a/crates/nano-arrow/src/array/boolean/fmt.rs b/crates/nano-arrow/src/array/boolean/fmt.rs new file mode 100644 index 000000000000..229a01cd3e03 --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/fmt.rs @@ -0,0 +1,17 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::write_vec; +use super::BooleanArray; + +pub fn write_value(array: &BooleanArray, index: usize, f: &mut W) -> Result { + write!(f, "{}", array.value(index)) +} + +impl Debug for BooleanArray { + fn fmt(&self, f: &mut Formatter) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, f); + + write!(f, "BooleanArray")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/boolean/from.rs b/crates/nano-arrow/src/array/boolean/from.rs new file mode 100644 index 000000000000..81a5395ccc06 --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/from.rs @@ -0,0 +1,15 @@ +use std::iter::FromIterator; + +use super::{BooleanArray, MutableBooleanArray}; + +impl]>> From

for BooleanArray { + fn from(slice: P) -> Self { + MutableBooleanArray::from(slice).into() + } +} + +impl>> FromIterator for BooleanArray { + fn from_iter>(iter: I) -> Self { + MutableBooleanArray::from_iter(iter).into() + } +} diff --git a/crates/nano-arrow/src/array/boolean/iterator.rs b/crates/nano-arrow/src/array/boolean/iterator.rs new file mode 100644 index 000000000000..8e914c98faab --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/iterator.rs @@ -0,0 +1,55 @@ +use super::super::MutableArray; +use super::{BooleanArray, MutableBooleanArray}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::IntoIter; + +impl<'a> IntoIterator for &'a BooleanArray { + type Item = Option; + type IntoIter = ZipValidity, BitmapIter<'a>>; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl IntoIterator for BooleanArray { + type Item = Option; + type IntoIter = ZipValidity; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + let (_, values, validity) = self.into_inner(); + let values = values.into_iter(); + let validity = + validity.and_then(|validity| (validity.unset_bits() > 0).then(|| validity.into_iter())); + ZipValidity::new(values, validity) + } +} + +impl<'a> IntoIterator for &'a MutableBooleanArray { + type Item = Option; + type IntoIter = ZipValidity, BitmapIter<'a>>; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> MutableBooleanArray { + /// Returns an iterator over the optional values of this [`MutableBooleanArray`]. + #[inline] + pub fn iter(&'a self) -> ZipValidity, BitmapIter<'a>> { + ZipValidity::new( + self.values().iter(), + self.validity().as_ref().map(|x| x.iter()), + ) + } + + /// Returns an iterator over the values of this [`MutableBooleanArray`] + #[inline] + pub fn values_iter(&'a self) -> BitmapIter<'a> { + self.values().iter() + } +} diff --git a/crates/nano-arrow/src/array/boolean/mod.rs b/crates/nano-arrow/src/array/boolean/mod.rs new file mode 100644 index 000000000000..93d484120faf --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/mod.rs @@ -0,0 +1,383 @@ +use either::Either; + +use super::Array; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Error; +use crate::trusted_len::TrustedLen; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod from; +mod iterator; +mod mutable; + +pub use iterator::*; +pub use mutable::*; + +/// A [`BooleanArray`] is Arrow's semantically equivalent of an immutable `Vec>`. +/// It implements [`Array`]. +/// +/// One way to think about a [`BooleanArray`] is `(DataType, Arc>, Option>>)` +/// where: +/// * the first item is the array's logical type +/// * the second is the immutable values +/// * the third is the immutable validity (whether a value is null or not as a bitmap). +/// +/// The size of this struct is `O(1)`, as all data is stored behind an [`std::sync::Arc`]. 
+/// # Example +/// ``` +/// use arrow2::array::BooleanArray; +/// use arrow2::bitmap::Bitmap; +/// use arrow2::buffer::Buffer; +/// +/// let array = BooleanArray::from([Some(true), None, Some(false)]); +/// assert_eq!(array.value(0), true); +/// assert_eq!(array.iter().collect::>(), vec![Some(true), None, Some(false)]); +/// assert_eq!(array.values_iter().collect::>(), vec![true, false, false]); +/// // the underlying representation +/// assert_eq!(array.values(), &Bitmap::from([true, false, false])); +/// assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true]))); +/// +/// ``` +#[derive(Clone)] +pub struct BooleanArray { + data_type: DataType, + values: Bitmap, + validity: Option, +} + +impl BooleanArray { + /// The canonical method to create a [`BooleanArray`] out of low-end APIs. + /// # Errors + /// This function errors iff: + /// * The validity is not `None` and its length is different from `values`'s length + /// * The `data_type`'s [`PhysicalType`] is not equal to [`PhysicalType::Boolean`]. + pub fn try_new( + data_type: DataType, + values: Bitmap, + validity: Option, + ) -> Result { + if validity + .as_ref() + .map_or(false, |validity| validity.len() != values.len()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != PhysicalType::Boolean { + return Err(Error::oos( + "BooleanArray can only be initialized with a DataType whose physical type is Boolean", + )); + } + + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Alias to `Self::try_new().unwrap()` + pub fn new(data_type: DataType, values: Bitmap, validity: Option) -> Self { + Self::try_new(data_type, values, validity).unwrap() + } + + /// Returns an iterator over the optional values of this [`BooleanArray`]. + #[inline] + pub fn iter(&self) -> ZipValidity { + ZipValidity::new_with_validity(self.values().iter(), self.validity()) + } + + /// Returns an iterator over the values of this [`BooleanArray`]. + #[inline] + pub fn values_iter(&self) -> BitmapIter { + self.values().iter() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() + } + + /// The values [`Bitmap`]. + /// Values on null slots are undetermined (they can be anything). + #[inline] + pub fn values(&self) -> &Bitmap { + &self.values + } + + /// Returns the optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Returns the arrays' [`DataType`]. + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } + + /// Returns the value at index `i` + /// # Panic + /// This function panics iff `i >= self.len()`. + #[inline] + pub fn value(&self, i: usize) -> bool { + self.values.get_bit(i) + } + + /// Returns the element at index `i` as bool + /// # Safety + /// Caller must be sure that `i < self.len()` + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> bool { + self.values.get_bit_unchecked(i) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } + + /// Slices this [`BooleanArray`]. + /// # Implementation + /// This operation is `O(1)` as it amounts to increase up to two ref counts. + /// # Panic + /// This function panics iff `offset + length > self.len()`. 
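As a complement to the doc example above, a hedged sketch of the low-level `try_new` path and the invariants it enforces (the `nano_arrow` crate path is assumed):

use nano_arrow::array::BooleanArray;
use nano_arrow::bitmap::Bitmap;
use nano_arrow::datatypes::DataType;

fn main() {
    let values = Bitmap::from([true, false, true]);
    let validity = Some(Bitmap::from([true, true, false]));
    let array = BooleanArray::try_new(DataType::Boolean, values, validity).unwrap();
    assert_eq!(array.len(), 3);
    // Slot 2 is null: `get` hides the undetermined value bit.
    assert_eq!(array.get(2), None);

    // A validity whose length differs from the values errors instead of panicking.
    let mismatched = BooleanArray::try_new(
        DataType::Boolean,
        Bitmap::from([true]),
        Some(Bitmap::from([true, false])),
    );
    assert!(mismatched.is_err());
}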
+ #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`BooleanArray`]. + /// # Implementation + /// This operation is `O(1)` as it amounts to increase two ref counts. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.values.slice_unchecked(offset, length); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); + + /// Returns a clone of this [`BooleanArray`] with new values. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + #[must_use] + pub fn with_values(&self, values: Bitmap) -> Self { + let mut out = self.clone(); + out.set_values(values); + out + } + + /// Sets the values of this [`BooleanArray`]. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + pub fn set_values(&mut self, values: Bitmap) { + assert_eq!( + values.len(), + self.len(), + "values length must be equal to this arrays length" + ); + self.values = values; + } + + /// Applies a function `f` to the values of this array, cloning the values + /// iff they are being shared with others + /// + /// This is an API to use clone-on-write + /// # Implementation + /// This function is `O(f)` if the data is not being shared, and `O(N) + O(f)` + /// if it is being shared (since it results in a `O(N)` memcopy). + /// # Panics + /// This function panics if the function modifies the length of the [`MutableBitmap`]. + pub fn apply_values_mut(&mut self, f: F) { + let values = std::mem::take(&mut self.values); + let mut values = values.make_mut(); + f(&mut values); + if let Some(validity) = &self.validity { + assert_eq!(validity.len(), values.len()); + } + self.values = values.into(); + } + + /// Try to convert this [`BooleanArray`] to a [`MutableBooleanArray`] + pub fn into_mut(self) -> Either { + use Either::*; + + if let Some(bitmap) = self.validity { + match bitmap.into_mut() { + Left(bitmap) => Left(BooleanArray::new(self.data_type, self.values, Some(bitmap))), + Right(mutable_bitmap) => match self.values.into_mut() { + Left(immutable) => Left(BooleanArray::new( + self.data_type, + immutable, + Some(mutable_bitmap.into()), + )), + Right(mutable) => Right( + MutableBooleanArray::try_new(self.data_type, mutable, Some(mutable_bitmap)) + .unwrap(), + ), + }, + } + } else { + match self.values.into_mut() { + Left(immutable) => Left(BooleanArray::new(self.data_type, immutable, None)), + Right(mutable) => { + Right(MutableBooleanArray::try_new(self.data_type, mutable, None).unwrap()) + }, + } + } + } + + /// Returns a new empty [`BooleanArray`]. + pub fn new_empty(data_type: DataType) -> Self { + Self::new(data_type, Bitmap::new(), None) + } + + /// Returns a new [`BooleanArray`] whose all slots are null / `None`. + pub fn new_null(data_type: DataType, length: usize) -> Self { + let bitmap = Bitmap::new_zeroed(length); + Self::new(data_type, bitmap.clone(), Some(bitmap)) + } + + /// Creates a new [`BooleanArray`] from an [`TrustedLen`] of `bool`. 
+ #[inline] + pub fn from_trusted_len_values_iter>(iterator: I) -> Self { + MutableBooleanArray::from_trusted_len_values_iter(iterator).into() + } + + /// Creates a new [`BooleanArray`] from an [`TrustedLen`] of `bool`. + /// Use this over [`BooleanArray::from_trusted_len_iter`] when the iterator is trusted len + /// but this crate does not mark it as such. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_values_iter_unchecked>( + iterator: I, + ) -> Self { + MutableBooleanArray::from_trusted_len_values_iter_unchecked(iterator).into() + } + + /// Creates a new [`BooleanArray`] from a slice of `bool`. + #[inline] + pub fn from_slice>(slice: P) -> Self { + MutableBooleanArray::from_slice(slice).into() + } + + /// Creates a [`BooleanArray`] from an iterator of trusted length. + /// Use this over [`BooleanArray::from_trusted_len_iter`] when the iterator is trusted len + /// but this crate does not mark it as such. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: Iterator>, + { + MutableBooleanArray::from_trusted_len_iter_unchecked(iterator).into() + } + + /// Creates a [`BooleanArray`] from a [`TrustedLen`]. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: TrustedLen>, + { + MutableBooleanArray::from_trusted_len_iter(iterator).into() + } + + /// Creates a [`BooleanArray`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked(iterator: I) -> Result + where + P: std::borrow::Borrow, + I: Iterator, E>>, + { + Ok(MutableBooleanArray::try_from_trusted_len_iter_unchecked(iterator)?.into()) + } + + /// Creates a [`BooleanArray`] from a [`TrustedLen`]. + #[inline] + pub fn try_from_trusted_len_iter(iterator: I) -> Result + where + P: std::borrow::Borrow, + I: TrustedLen, E>>, + { + Ok(MutableBooleanArray::try_from_trusted_len_iter(iterator)?.into()) + } + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (DataType, Bitmap, Option) { + let Self { + data_type, + values, + validity, + } = self; + (data_type, values, validity) + } + + /// Creates a `[BooleanArray]` from its internal representation. + /// This is the inverted from `[BooleanArray::into_inner]` + /// + /// # Safety + /// Callers must ensure all invariants of this struct are upheld. 
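A short sketch of the trusted-length constructors and the `into_inner`/`from_inner_unchecked` round trip described above (crate path assumed; `slice::Iter` and its `Copied` adapter carry this crate's `TrustedLen`, which is what `from_slice` relies on internally):

use nano_arrow::array::BooleanArray;

fn main() {
    let bools = [true, true, false];
    // `bools.iter().copied()` satisfies this crate's `TrustedLen`, so the safe
    // constructor can be used instead of the `_unchecked` variant.
    let array = BooleanArray::from_trusted_len_values_iter(bools.iter().copied());
    assert_eq!(array.values_iter().collect::<Vec<_>>(), vec![true, true, false]);

    // `into_inner` exposes the raw parts; `from_inner_unchecked` is its unsafe inverse.
    let (data_type, values, validity) = array.into_inner();
    assert!(validity.is_none());
    let roundtrip = unsafe { BooleanArray::from_inner_unchecked(data_type, values, validity) };
    assert_eq!(roundtrip.len(), 3);
}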
+ pub unsafe fn from_inner_unchecked( + data_type: DataType, + values: Bitmap, + validity: Option, + ) -> Self { + Self { + data_type, + values, + validity, + } + } +} + +impl Array for BooleanArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/boolean/mutable.rs b/crates/nano-arrow/src/array/boolean/mutable.rs new file mode 100644 index 000000000000..9961cadcb2fd --- /dev/null +++ b/crates/nano-arrow/src/array/boolean/mutable.rs @@ -0,0 +1,564 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::BooleanArray; +use crate::array::physical_binary::extend_validity; +use crate::array::{Array, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Error; +use crate::trusted_len::TrustedLen; + +/// The Arrow's equivalent to `Vec>`, but with `1/16` of its size. +/// Converting a [`MutableBooleanArray`] into a [`BooleanArray`] is `O(1)`. +/// # Implementation +/// This struct does not allocate a validity until one is required (i.e. push a null to it). +#[derive(Debug, Clone)] +pub struct MutableBooleanArray { + data_type: DataType, + values: MutableBitmap, + validity: Option, +} + +impl From for BooleanArray { + fn from(other: MutableBooleanArray) -> Self { + BooleanArray::new( + other.data_type, + other.values.into(), + other.validity.map(|x| x.into()), + ) + } +} + +impl]>> From

for MutableBooleanArray { + /// Creates a new [`MutableBooleanArray`] out of a slice of Optional `bool`. + fn from(slice: P) -> Self { + Self::from_trusted_len_iter(slice.as_ref().iter().map(|x| x.as_ref())) + } +} + +impl Default for MutableBooleanArray { + fn default() -> Self { + Self::new() + } +} + +impl MutableBooleanArray { + /// Creates an new empty [`MutableBooleanArray`]. + pub fn new() -> Self { + Self::with_capacity(0) + } + + /// The canonical method to create a [`MutableBooleanArray`] out of low-end APIs. + /// # Errors + /// This function errors iff: + /// * The validity is not `None` and its length is different from `values`'s length + /// * The `data_type`'s [`PhysicalType`] is not equal to [`PhysicalType::Boolean`]. + pub fn try_new( + data_type: DataType, + values: MutableBitmap, + validity: Option, + ) -> Result { + if validity + .as_ref() + .map_or(false, |validity| validity.len() != values.len()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != PhysicalType::Boolean { + return Err(Error::oos( + "MutableBooleanArray can only be initialized with a DataType whose physical type is Boolean", + )); + } + + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Creates an new [`MutableBooleanArray`] with a capacity of values. + pub fn with_capacity(capacity: usize) -> Self { + Self { + data_type: DataType::Boolean, + values: MutableBitmap::with_capacity(capacity), + validity: None, + } + } + + /// Reserves `additional` slots. + pub fn reserve(&mut self, additional: usize) { + self.values.reserve(additional); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Pushes a new entry to [`MutableBooleanArray`]. + pub fn push(&mut self, value: Option) { + match value { + Some(value) => { + self.values.push(value); + match &mut self.validity { + Some(validity) => validity.push(true), + None => {}, + } + }, + None => { + self.values.push(false); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + }, + } + } + + /// Pop an entry from [`MutableBooleanArray`]. + /// Note If the values is empty, this method will return None. + pub fn pop(&mut self) -> Option { + let value = self.values.pop()?; + self.validity + .as_mut() + .map(|x| x.pop()?.then(|| value)) + .unwrap_or_else(|| Some(value)) + } + + /// Extends the [`MutableBooleanArray`] from an iterator of values of trusted len. + /// This differs from `extend_trusted_len` which accepts in iterator of optional values. + #[inline] + pub fn extend_trusted_len_values(&mut self, iterator: I) + where + I: TrustedLen, + { + // Safety: `I` is `TrustedLen` + unsafe { self.extend_trusted_len_values_unchecked(iterator) } + } + + /// Extends the [`MutableBooleanArray`] from an iterator of values of trusted len. + /// This differs from `extend_trusted_len_unchecked`, which accepts in iterator of optional values. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_values_unchecked(&mut self, iterator: I) + where + I: Iterator, + { + let (_, upper) = iterator.size_hint(); + let additional = + upper.expect("extend_trusted_len_values_unchecked requires an upper limit"); + + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(additional, true); + } + + self.values.extend_from_trusted_len_iter_unchecked(iterator) + } + + /// Extends the [`MutableBooleanArray`] from an iterator of trusted len. 
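A hedged sketch of the mutable API above: pushing the first null lazily allocates the validity bitmap, and freezing into a `BooleanArray` is `O(1)` (crate path assumed):

use nano_arrow::array::{BooleanArray, MutableBooleanArray};

fn main() {
    let mut array = MutableBooleanArray::with_capacity(3);
    array.push(Some(true));
    array.push(None); // the first null initializes the validity bitmap
    array.push(Some(false));
    assert_eq!(array.pop(), Some(false));

    // Freezing converts the mutable bitmaps into immutable ones without copying.
    let frozen: BooleanArray = array.into();
    assert_eq!(frozen.len(), 2);
    assert_eq!(frozen.get(1), None);
}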
+ #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: std::borrow::Borrow, + I: TrustedLen>, + { + // Safety: `I` is `TrustedLen` + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends the [`MutableBooleanArray`] from an iterator of trusted len. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: std::borrow::Borrow, + I: Iterator>, + { + if let Some(validity) = self.validity.as_mut() { + extend_trusted_len_unzip(iterator, validity, &mut self.values); + } else { + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + + extend_trusted_len_unzip(iterator, &mut validity, &mut self.values); + + if validity.unset_bits() > 0 { + self.validity = Some(validity); + } + } + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + validity.extend_constant(self.len(), true); + validity.set(self.len() - 1, false); + self.validity = Some(validity) + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: BooleanArray = self.into(); + Arc::new(a) + } +} + +/// Getters +impl MutableBooleanArray { + /// Returns its values. + pub fn values(&self) -> &MutableBitmap { + &self.values + } +} + +/// Setters +impl MutableBooleanArray { + /// Sets position `index` to `value`. + /// Note that if it is the first time a null appears in this array, + /// this initializes the validity bitmap (`O(N)`). + /// # Panic + /// Panics iff index is larger than `self.len()`. + pub fn set(&mut self, index: usize, value: Option) { + self.values.set(index, value.unwrap_or_default()); + + if value.is_none() && self.validity.is_none() { + // When the validity is None, all elements so far are valid. When one of the elements is set of null, + // the validity must be initialized. + self.validity = Some(MutableBitmap::from_trusted_len_iter( + std::iter::repeat(true).take(self.len()), + )); + } + if let Some(x) = self.validity.as_mut() { + x.set(index, value.is_some()) + } + } +} + +/// From implementations +impl MutableBooleanArray { + /// Creates a new [`MutableBooleanArray`] from an [`TrustedLen`] of `bool`. + #[inline] + pub fn from_trusted_len_values_iter>(iterator: I) -> Self { + Self::try_new( + DataType::Boolean, + MutableBitmap::from_trusted_len_iter(iterator), + None, + ) + .unwrap() + } + + /// Creates a new [`MutableBooleanArray`] from an [`TrustedLen`] of `bool`. + /// Use this over [`BooleanArray::from_trusted_len_iter`] when the iterator is trusted len + /// but this crate does not mark it as such. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_values_iter_unchecked>( + iterator: I, + ) -> Self { + let mut mutable = MutableBitmap::new(); + mutable.extend_from_trusted_len_iter_unchecked(iterator); + MutableBooleanArray::try_new(DataType::Boolean, mutable, None).unwrap() + } + + /// Creates a new [`MutableBooleanArray`] from a slice of `bool`. + #[inline] + pub fn from_slice>(slice: P) -> Self { + Self::from_trusted_len_values_iter(slice.as_ref().iter().copied()) + } + + /// Creates a [`BooleanArray`] from an iterator of trusted length. + /// Use this over [`BooleanArray::from_trusted_len_iter`] when the iterator is trusted len + /// but this crate does not mark it as such. 
+ /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: Iterator>, + { + let (validity, values) = trusted_len_unzip(iterator); + + Self::try_new(DataType::Boolean, values, validity).unwrap() + } + + /// Creates a [`BooleanArray`] from a [`TrustedLen`]. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: TrustedLen>, + { + // Safety: `I` is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a [`BooleanArray`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked( + iterator: I, + ) -> std::result::Result + where + P: std::borrow::Borrow, + I: Iterator, E>>, + { + let (validity, values) = try_trusted_len_unzip(iterator)?; + + let validity = if validity.unset_bits() > 0 { + Some(validity) + } else { + None + }; + + Ok(Self::try_new(DataType::Boolean, values, validity).unwrap()) + } + + /// Creates a [`BooleanArray`] from a [`TrustedLen`]. + #[inline] + pub fn try_from_trusted_len_iter(iterator: I) -> std::result::Result + where + P: std::borrow::Borrow, + I: TrustedLen, E>>, + { + // Safety: `I` is `TrustedLen` + unsafe { Self::try_from_trusted_len_iter_unchecked(iterator) } + } + + /// Shrinks the capacity of the [`MutableBooleanArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } +} + +/// Creates a Bitmap and an optional [`MutableBitmap`] from an iterator of `Option`. +/// The first buffer corresponds to a bitmap buffer, the second one +/// corresponds to a values buffer. +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +pub(crate) unsafe fn trusted_len_unzip(iterator: I) -> (Option, MutableBitmap) +where + P: std::borrow::Borrow, + I: Iterator>, +{ + let mut validity = MutableBitmap::new(); + let mut values = MutableBitmap::new(); + + extend_trusted_len_unzip(iterator, &mut validity, &mut values); + + let validity = if validity.unset_bits() > 0 { + Some(validity) + } else { + None + }; + + (validity, values) +} + +/// Extends validity [`MutableBitmap`] and values [`MutableBitmap`] from an iterator of `Option`. +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. 
+#[inline] +pub(crate) unsafe fn extend_trusted_len_unzip( + iterator: I, + validity: &mut MutableBitmap, + values: &mut MutableBitmap, +) where + P: std::borrow::Borrow, + I: Iterator>, +{ + let (_, upper) = iterator.size_hint(); + let additional = upper.expect("extend_trusted_len_unzip requires an upper limit"); + + // Length of the array before new values are pushed, + // variable created for assertion post operation + let pre_length = values.len(); + + validity.reserve(additional); + values.reserve(additional); + + for item in iterator { + let item = if let Some(item) = item { + validity.push_unchecked(true); + *item.borrow() + } else { + validity.push_unchecked(false); + bool::default() + }; + values.push_unchecked(item); + } + + debug_assert_eq!( + values.len(), + pre_length + additional, + "Trusted iterator length was not accurately reported" + ); +} + +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +pub(crate) unsafe fn try_trusted_len_unzip( + iterator: I, +) -> std::result::Result<(MutableBitmap, MutableBitmap), E> +where + P: std::borrow::Borrow, + I: Iterator, E>>, +{ + let (_, upper) = iterator.size_hint(); + let len = upper.expect("trusted_len_unzip requires an upper limit"); + + let mut null = MutableBitmap::with_capacity(len); + let mut values = MutableBitmap::with_capacity(len); + + for item in iterator { + let item = if let Some(item) = item? { + null.push(true); + *item.borrow() + } else { + null.push(false); + false + }; + values.push(item); + } + assert_eq!( + values.len(), + len, + "Trusted iterator length was not accurately reported" + ); + values.set_len(len); + null.set_len(len); + + Ok((null, values)) +} + +impl>> FromIterator for MutableBooleanArray { + fn from_iter>(iter: I) -> Self { + let iter = iter.into_iter(); + let (lower, _) = iter.size_hint(); + + let mut validity = MutableBitmap::with_capacity(lower); + + let values: MutableBitmap = iter + .map(|item| { + if let Some(a) = item.borrow() { + validity.push(true); + *a + } else { + validity.push(false); + false + } + }) + .collect(); + + let validity = if validity.unset_bits() > 0 { + Some(validity) + } else { + None + }; + + MutableBooleanArray::try_new(DataType::Boolean, values, validity).unwrap() + } +} + +impl MutableArray for MutableBooleanArray { + fn len(&self) -> usize { + self.values.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + let array: BooleanArray = std::mem::take(self).into(); + array.boxed() + } + + fn as_arc(&mut self) -> Arc { + let array: BooleanArray = std::mem::take(self).into(); + array.arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push(None) + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl Extend> for MutableBooleanArray { + fn extend>>(&mut self, iter: I) { + let iter = iter.into_iter(); + self.reserve(iter.size_hint().0); + iter.for_each(|x| self.push(x)) + } +} + +impl TryExtend> for MutableBooleanArray { + /// This is infalible and is implemented for consistency with all other types + fn try_extend>>(&mut self, iter: I) -> Result<(), Error> { + self.extend(iter); + Ok(()) + } +} + +impl TryPush> for MutableBooleanArray { + /// This is infalible and is implemented 
for consistency with all other types + fn try_push(&mut self, item: Option) -> Result<(), Error> { + self.push(item); + Ok(()) + } +} + +impl PartialEq for MutableBooleanArray { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl TryExtendFromSelf for MutableBooleanArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<(), Error> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + let slice = other.values.as_slice(); + // safety: invariant offset + length <= slice.len() + unsafe { + self.values + .extend_from_slice_unchecked(slice, 0, other.values.len()); + } + Ok(()) + } +} diff --git a/crates/nano-arrow/src/array/dictionary/data.rs b/crates/nano-arrow/src/array/dictionary/data.rs new file mode 100644 index 000000000000..ecc763c350b3 --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/data.rs @@ -0,0 +1,49 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{ + from_data, to_data, Arrow2Arrow, DictionaryArray, DictionaryKey, PrimitiveArray, +}; +use crate::datatypes::{DataType, PhysicalType}; + +impl Arrow2Arrow for DictionaryArray { + fn to_data(&self) -> ArrayData { + let keys = self.keys.to_data(); + let builder = keys + .into_builder() + .data_type(self.data_type.clone().into()) + .child_data(vec![to_data(self.values.as_ref())]); + + // Safety: Dictionary is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let key = match data.data_type() { + arrow_schema::DataType::Dictionary(k, _) => k.as_ref(), + d => panic!("unsupported dictionary type {d}"), + }; + + let data_type = DataType::from(data.data_type().clone()); + assert_eq!( + data_type.to_physical_type(), + PhysicalType::Dictionary(K::KEY_TYPE) + ); + + let key_builder = ArrayDataBuilder::new(key.clone()) + .buffers(vec![data.buffers()[0].clone()]) + .offset(data.offset()) + .len(data.len()) + .nulls(data.nulls().cloned()); + + // Safety: Dictionary is valid + let key_data = unsafe { key_builder.build_unchecked() }; + let keys = PrimitiveArray::from_data(&key_data); + let values = from_data(&data.child_data()[0]); + + Self { + data_type, + keys, + values, + } + } +} diff --git a/crates/nano-arrow/src/array/dictionary/ffi.rs b/crates/nano-arrow/src/array/dictionary/ffi.rs new file mode 100644 index 000000000000..946c850c48b1 --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/ffi.rs @@ -0,0 +1,41 @@ +use super::{DictionaryArray, DictionaryKey}; +use crate::array::{FromFfi, PrimitiveArray, ToFfi}; +use crate::error::Error; +use crate::ffi; + +unsafe impl ToFfi for DictionaryArray { + fn buffers(&self) -> Vec> { + self.keys.buffers() + } + + fn offset(&self) -> Option { + self.keys.offset() + } + + fn to_ffi_aligned(&self) -> Self { + Self { + data_type: self.data_type.clone(), + keys: self.keys.to_ffi_aligned(), + values: self.values.clone(), + } + } +} + +impl FromFfi for DictionaryArray { + unsafe fn try_from_ffi(array: A) -> Result { + // keys: similar to PrimitiveArray, but the datatype is the inner one + let validity = unsafe { array.validity() }?; + let values = unsafe { array.buffer::(1) }?; + + let data_type = array.data_type().clone(); + + let keys = PrimitiveArray::::try_new(K::PRIMITIVE.into(), values, validity)?; + let values = array + .dictionary()? 
+ .ok_or_else(|| Error::oos("Dictionary Array must contain a dictionary in ffi"))?; + let values = ffi::try_from(values)?; + + // the assumption of this trait + DictionaryArray::::try_new_unchecked(data_type, keys, values) + } +} diff --git a/crates/nano-arrow/src/array/dictionary/fmt.rs b/crates/nano-arrow/src/array/dictionary/fmt.rs new file mode 100644 index 000000000000..b3ce55515902 --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/fmt.rs @@ -0,0 +1,31 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_vec}; +use super::{DictionaryArray, DictionaryKey}; +use crate::array::Array; + +pub fn write_value( + array: &DictionaryArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let keys = array.keys(); + let values = array.values(); + + if keys.is_valid(index) { + let key = array.key_value(index); + get_display(values.as_ref(), null)(f, key) + } else { + write!(f, "{null}") + } +} + +impl Debug for DictionaryArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + write!(f, "DictionaryArray")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/dictionary/iterator.rs b/crates/nano-arrow/src/array/dictionary/iterator.rs new file mode 100644 index 000000000000..68e95ca86fed --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/iterator.rs @@ -0,0 +1,67 @@ +use super::{DictionaryArray, DictionaryKey}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::scalar::Scalar; +use crate::trusted_len::TrustedLen; + +/// Iterator of values of an `ListArray`. +pub struct DictionaryValuesIter<'a, K: DictionaryKey> { + array: &'a DictionaryArray, + index: usize, + end: usize, +} + +impl<'a, K: DictionaryKey> DictionaryValuesIter<'a, K> { + #[inline] + pub fn new(array: &'a DictionaryArray) -> Self { + Self { + array, + index: 0, + end: array.len(), + } + } +} + +impl<'a, K: DictionaryKey> Iterator for DictionaryValuesIter<'a, K> { + type Item = Box; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + Some(self.array.value(old)) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } +} + +unsafe impl<'a, K: DictionaryKey> TrustedLen for DictionaryValuesIter<'a, K> {} + +impl<'a, K: DictionaryKey> DoubleEndedIterator for DictionaryValuesIter<'a, K> { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + Some(self.array.value(self.end)) + } + } +} + +type ValuesIter<'a, K> = DictionaryValuesIter<'a, K>; +type ZipIter<'a, K> = ZipValidity, ValuesIter<'a, K>, BitmapIter<'a>>; + +impl<'a, K: DictionaryKey> IntoIterator for &'a DictionaryArray { + type Item = Option>; + type IntoIter = ZipIter<'a, K>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} diff --git a/crates/nano-arrow/src/array/dictionary/mod.rs b/crates/nano-arrow/src/array/dictionary/mod.rs new file mode 100644 index 000000000000..2ffb08c01c40 --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/mod.rs @@ -0,0 +1,413 @@ +use std::hash::Hash; +use std::hint::unreachable_unchecked; + +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, IntegerType}; +use crate::error::Error; +use crate::scalar::{new_scalar, 
Scalar}; +use crate::trusted_len::TrustedLen; +use crate::types::NativeType; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +mod mutable; +use crate::array::specification::check_indexes_unchecked; +mod typed_iterator; +mod value_map; + +pub use iterator::*; +pub use mutable::*; + +use super::primitive::PrimitiveArray; +use super::specification::check_indexes; +use super::{new_empty_array, new_null_array, Array}; +use crate::array::dictionary::typed_iterator::{DictValue, DictionaryValuesIterTyped}; + +/// Trait denoting [`NativeType`]s that can be used as keys of a dictionary. +/// # Safety +/// +/// Any implementation of this trait must ensure that `always_fits_usize` only +/// returns `true` if all values succeeds on `value::try_into::().unwrap()`. +pub unsafe trait DictionaryKey: NativeType + TryInto + TryFrom + Hash { + /// The corresponding [`IntegerType`] of this key + const KEY_TYPE: IntegerType; + + /// Represents this key as a `usize`. + /// # Safety + /// The caller _must_ have checked that the value can be casted to `usize`. + #[inline] + unsafe fn as_usize(self) -> usize { + match self.try_into() { + Ok(v) => v, + Err(_) => unreachable_unchecked(), + } + } + + /// If the key type always can be converted to `usize`. + fn always_fits_usize() -> bool { + false + } +} + +unsafe impl DictionaryKey for i8 { + const KEY_TYPE: IntegerType = IntegerType::Int8; +} +unsafe impl DictionaryKey for i16 { + const KEY_TYPE: IntegerType = IntegerType::Int16; +} +unsafe impl DictionaryKey for i32 { + const KEY_TYPE: IntegerType = IntegerType::Int32; +} +unsafe impl DictionaryKey for i64 { + const KEY_TYPE: IntegerType = IntegerType::Int64; +} +unsafe impl DictionaryKey for u8 { + const KEY_TYPE: IntegerType = IntegerType::UInt8; + + fn always_fits_usize() -> bool { + true + } +} +unsafe impl DictionaryKey for u16 { + const KEY_TYPE: IntegerType = IntegerType::UInt16; + + fn always_fits_usize() -> bool { + true + } +} +unsafe impl DictionaryKey for u32 { + const KEY_TYPE: IntegerType = IntegerType::UInt32; + + fn always_fits_usize() -> bool { + true + } +} +unsafe impl DictionaryKey for u64 { + const KEY_TYPE: IntegerType = IntegerType::UInt64; + + #[cfg(target_pointer_width = "64")] + fn always_fits_usize() -> bool { + true + } +} + +/// An [`Array`] whose values are stored as indices. This [`Array`] is useful when the cardinality of +/// values is low compared to the length of the [`Array`]. +/// +/// # Safety +/// This struct guarantees that each item of [`DictionaryArray::keys`] is castable to `usize` and +/// its value is smaller than [`DictionaryArray::values`]`.len()`. 
In other words, you can safely +/// use `unchecked` calls to retrieve the values +#[derive(Clone)] +pub struct DictionaryArray { + data_type: DataType, + keys: PrimitiveArray, + values: Box, +} + +fn check_data_type( + key_type: IntegerType, + data_type: &DataType, + values_data_type: &DataType, +) -> Result<(), Error> { + if let DataType::Dictionary(key, value, _) = data_type.to_logical_type() { + if *key != key_type { + return Err(Error::oos( + "DictionaryArray must be initialized with a DataType::Dictionary whose integer is compatible to its keys", + )); + } + if value.as_ref().to_logical_type() != values_data_type.to_logical_type() { + return Err(Error::oos( + "DictionaryArray must be initialized with a DataType::Dictionary whose value is equal to its values", + )); + } + } else { + return Err(Error::oos( + "DictionaryArray must be initialized with logical DataType::Dictionary", + )); + } + Ok(()) +} + +impl DictionaryArray { + /// Returns a new [`DictionaryArray`]. + /// # Implementation + /// This function is `O(N)` where `N` is the length of keys + /// # Errors + /// This function errors iff + /// * the `data_type`'s logical type is not a `DictionaryArray` + /// * the `data_type`'s keys is not compatible with `keys` + /// * the `data_type`'s values's data_type is not equal with `values.data_type()` + /// * any of the keys's values is not represented in `usize` or is `>= values.len()` + pub fn try_new( + data_type: DataType, + keys: PrimitiveArray, + values: Box, + ) -> Result { + check_data_type(K::KEY_TYPE, &data_type, values.data_type())?; + + if keys.null_count() != keys.len() { + if K::always_fits_usize() { + // safety: we just checked that conversion to `usize` always + // succeeds + unsafe { check_indexes_unchecked(keys.values(), values.len()) }?; + } else { + check_indexes(keys.values(), values.len())?; + } + } + + Ok(Self { + data_type, + keys, + values, + }) + } + + /// Returns a new [`DictionaryArray`]. + /// # Implementation + /// This function is `O(N)` where `N` is the length of keys + /// # Errors + /// This function errors iff + /// * any of the keys's values is not represented in `usize` or is `>= values.len()` + pub fn try_from_keys(keys: PrimitiveArray, values: Box) -> Result { + let data_type = Self::default_data_type(values.data_type().clone()); + Self::try_new(data_type, keys, values) + } + + /// Returns a new [`DictionaryArray`]. + /// # Errors + /// This function errors iff + /// * the `data_type`'s logical type is not a `DictionaryArray` + /// * the `data_type`'s keys is not compatible with `keys` + /// * the `data_type`'s values's data_type is not equal with `values.data_type()` + /// # Safety + /// The caller must ensure that every keys's values is represented in `usize` and is `< values.len()` + pub unsafe fn try_new_unchecked( + data_type: DataType, + keys: PrimitiveArray, + values: Box, + ) -> Result { + check_data_type(K::KEY_TYPE, &data_type, values.data_type())?; + + Ok(Self { + data_type, + keys, + values, + }) + } + + /// Returns a new empty [`DictionaryArray`]. 
+ pub fn new_empty(data_type: DataType) -> Self { + let values = Self::try_get_child(&data_type).unwrap(); + let values = new_empty_array(values.clone()); + Self::try_new( + data_type, + PrimitiveArray::::new_empty(K::PRIMITIVE.into()), + values, + ) + .unwrap() + } + + /// Returns an [`DictionaryArray`] whose all elements are null + #[inline] + pub fn new_null(data_type: DataType, length: usize) -> Self { + let values = Self::try_get_child(&data_type).unwrap(); + let values = new_null_array(values.clone(), 1); + Self::try_new( + data_type, + PrimitiveArray::::new_null(K::PRIMITIVE.into(), length), + values, + ) + .unwrap() + } + + /// Returns an iterator of [`Option>`]. + /// # Implementation + /// This function will allocate a new [`Scalar`] per item and is usually not performant. + /// Consider calling `keys_iter` and `values`, downcasting `values`, and iterating over that. + pub fn iter(&self) -> ZipValidity, DictionaryValuesIter, BitmapIter> { + ZipValidity::new_with_validity(DictionaryValuesIter::new(self), self.keys.validity()) + } + + /// Returns an iterator of [`Box`] + /// # Implementation + /// This function will allocate a new [`Scalar`] per item and is usually not performant. + /// Consider calling `keys_iter` and `values`, downcasting `values`, and iterating over that. + pub fn values_iter(&self) -> DictionaryValuesIter { + DictionaryValuesIter::new(self) + } + + /// Returns an iterator over the the values [`V::IterValue`]. + /// + /// # Panics + /// + /// Panics if the keys of this [`DictionaryArray`] have any null types. + /// If they do [`DictionaryArray::iter_typed`] should be called + pub fn values_iter_typed( + &self, + ) -> Result, Error> { + let keys = &self.keys; + assert_eq!(keys.null_count(), 0); + let values = self.values.as_ref(); + let values = V::downcast_values(values)?; + Ok(unsafe { DictionaryValuesIterTyped::new(keys, values) }) + } + + /// Returns an iterator over the the optional values of [`Option`]. + /// + /// # Panics + /// + /// This function panics if the `values` array + pub fn iter_typed( + &self, + ) -> Result, DictionaryValuesIterTyped, BitmapIter>, Error> + { + let keys = &self.keys; + let values = self.values.as_ref(); + let values = V::downcast_values(values)?; + let values_iter = unsafe { DictionaryValuesIterTyped::new(keys, values) }; + Ok(ZipValidity::new_with_validity(values_iter, self.validity())) + } + + /// Returns the [`DataType`] of this [`DictionaryArray`] + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } + + /// Returns whether the values of this [`DictionaryArray`] are ordered + #[inline] + pub fn is_ordered(&self) -> bool { + match self.data_type.to_logical_type() { + DataType::Dictionary(_, _, is_ordered) => *is_ordered, + _ => unreachable!(), + } + } + + pub(crate) fn default_data_type(values_datatype: DataType) -> DataType { + DataType::Dictionary(K::KEY_TYPE, Box::new(values_datatype), false) + } + + /// Slices this [`DictionaryArray`]. + /// # Panics + /// iff `offset + length > self.len()`. + pub fn slice(&mut self, offset: usize, length: usize) { + self.keys.slice(offset, length); + } + + /// Slices this [`DictionaryArray`]. + /// # Safety + /// Safe iff `offset + length <= self.len()`. + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.keys.slice_unchecked(offset, length); + } + + impl_sliced!(); + + /// Returns this [`DictionaryArray`] with a new validity. + /// # Panic + /// This function panics iff `validity.len() != self.len()`. 
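A sketch tying together the constructors above and the key accessors defined just below, including the downcast pattern the `iter` docs recommend over allocating a `Scalar` per row (the crate path and the `from_slice`/`boxed` helpers from elsewhere in the crate are assumptions):

use nano_arrow::array::{Array, DictionaryArray, PrimitiveArray, Utf8Array};

fn main() {
    // Keys index into the deduplicated values; `try_from_keys` derives the
    // `DataType::Dictionary(..)` logical type and bound-checks every key.
    let keys = PrimitiveArray::<u32>::from_slice([0u32, 1, 0]);
    let values = Utf8Array::<i32>::from_slice(["x", "y"]).boxed();
    let dict = DictionaryArray::try_from_keys(keys, values).unwrap();

    // Downcast `values` once, then resolve keys manually instead of calling `iter()`.
    let utf8 = dict
        .values()
        .as_any()
        .downcast_ref::<Utf8Array<i32>>()
        .unwrap();
    let resolved: Vec<Option<&str>> = dict
        .keys_iter()
        .map(|key| key.map(|k| utf8.value(k)))
        .collect();
    assert_eq!(resolved, vec![Some("x"), Some("y"), Some("x")]);
}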
+ #[must_use] + pub fn with_validity(mut self, validity: Option) -> Self { + self.set_validity(validity); + self + } + + /// Sets the validity of the keys of this [`DictionaryArray`]. + /// # Panics + /// This function panics iff `validity.len() != self.len()`. + pub fn set_validity(&mut self, validity: Option) { + self.keys.set_validity(validity); + } + + impl_into_array!(); + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.keys.len() + } + + /// The optional validity. Equivalent to `self.keys().validity()`. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.keys.validity() + } + + /// Returns the keys of the [`DictionaryArray`]. These keys can be used to fetch values + /// from `values`. + #[inline] + pub fn keys(&self) -> &PrimitiveArray { + &self.keys + } + + /// Returns an iterator of the keys' values of the [`DictionaryArray`] as `usize` + #[inline] + pub fn keys_values_iter(&self) -> impl TrustedLen + Clone + '_ { + // safety - invariant of the struct + self.keys.values_iter().map(|x| unsafe { x.as_usize() }) + } + + /// Returns an iterator of the keys' of the [`DictionaryArray`] as `usize` + #[inline] + pub fn keys_iter(&self) -> impl TrustedLen> + Clone + '_ { + // safety - invariant of the struct + self.keys.iter().map(|x| x.map(|x| unsafe { x.as_usize() })) + } + + /// Returns the keys' value of the [`DictionaryArray`] as `usize` + /// # Panics + /// This function panics iff `index >= self.len()` + #[inline] + pub fn key_value(&self, index: usize) -> usize { + // safety - invariant of the struct + unsafe { self.keys.values()[index].as_usize() } + } + + /// Returns the values of the [`DictionaryArray`]. + #[inline] + pub fn values(&self) -> &Box { + &self.values + } + + /// Returns the value of the [`DictionaryArray`] at position `i`. + /// # Implementation + /// This function will allocate a new [`Scalar`] and is usually not performant. + /// Consider calling `keys` and `values`, downcasting `values`, and iterating over that. 
+ /// # Panic + /// This function panics iff `index >= self.len()` + #[inline] + pub fn value(&self, index: usize) -> Box { + // safety - invariant of this struct + let index = unsafe { self.keys.value(index).as_usize() }; + new_scalar(self.values.as_ref(), index) + } + + pub(crate) fn try_get_child(data_type: &DataType) -> Result<&DataType, Error> { + Ok(match data_type.to_logical_type() { + DataType::Dictionary(_, values, _) => values.as_ref(), + _ => { + return Err(Error::oos( + "Dictionaries must be initialized with DataType::Dictionary", + )) + }, + }) + } +} + +impl Array for DictionaryArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.keys.validity() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/dictionary/mutable.rs b/crates/nano-arrow/src/array/dictionary/mutable.rs new file mode 100644 index 000000000000..dedd6ead0eaa --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/mutable.rs @@ -0,0 +1,241 @@ +use std::hash::Hash; +use std::sync::Arc; + +use super::value_map::ValueMap; +use super::{DictionaryArray, DictionaryKey}; +use crate::array::indexable::{AsIndexed, Indexable}; +use crate::array::primitive::MutablePrimitiveArray; +use crate::array::{Array, MutableArray, TryExtend, TryPush}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; + +/// A mutable, strong-typed version of [`DictionaryArray`]. +/// +/// # Example +/// Building a UTF8 dictionary with `i32` keys. +/// ``` +/// # use arrow2::array::{MutableDictionaryArray, MutableUtf8Array, TryPush}; +/// # fn main() -> Result<(), Box> { +/// let mut array: MutableDictionaryArray> = MutableDictionaryArray::new(); +/// array.try_push(Some("A"))?; +/// array.try_push(Some("B"))?; +/// array.push_null(); +/// array.try_push(Some("C"))?; +/// # Ok(()) +/// # } +/// ``` +#[derive(Debug)] +pub struct MutableDictionaryArray { + data_type: DataType, + map: ValueMap, + // invariant: `max(keys) < map.values().len()` + keys: MutablePrimitiveArray, +} + +impl From> for DictionaryArray { + fn from(other: MutableDictionaryArray) -> Self { + // Safety - the invariant of this struct ensures that this is up-held + unsafe { + DictionaryArray::::try_new_unchecked( + other.data_type, + other.keys.into(), + other.map.into_values().as_box(), + ) + .unwrap() + } + } +} + +impl MutableDictionaryArray { + /// Creates an empty [`MutableDictionaryArray`]. + pub fn new() -> Self { + Self::try_empty(M::default()).unwrap() + } +} + +impl Default for MutableDictionaryArray { + fn default() -> Self { + Self::new() + } +} + +impl MutableDictionaryArray { + /// Creates an empty [`MutableDictionaryArray`] from a given empty values array. + /// # Errors + /// Errors if the array is non-empty. + pub fn try_empty(values: M) -> Result { + Ok(Self::from_value_map(ValueMap::::try_empty(values)?)) + } + + /// Creates an empty [`MutableDictionaryArray`] preloaded with a given dictionary of values. + /// Indices associated with those values are automatically assigned based on the order of + /// the values. + /// # Errors + /// Errors if there's more values than the maximum value of `K` or if values are not unique. 
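A sketch of the pre-loaded path described above: `from_values` seeds the dictionary and assigns keys in insertion order, and later pushes of an existing value reuse its key (crate path assumed; this relies on `MutableUtf8Array` providing the `Indexable`/`AsIndexed` machinery used by this module):

use nano_arrow::array::{DictionaryArray, MutableDictionaryArray, MutableUtf8Array, TryPush};

fn main() {
    // Seed the dictionary values; `from_values` assigns keys 0, 1, 2 in this order
    // and errors if the seed contains duplicates.
    let mut seed = MutableUtf8Array::<i32>::new();
    for v in ["low", "mid", "high"] {
        seed.push(Some(v));
    }
    let mut dict = MutableDictionaryArray::<u32, _>::from_values(seed).unwrap();

    // Pushing a value that is already in the dictionary reuses its key.
    dict.try_push(Some("mid")).unwrap();
    dict.push_null();

    let array: DictionaryArray<u32> = dict.into();
    assert_eq!(array.len(), 2);
    assert_eq!(array.values().len(), 3);
}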
+ pub fn from_values(values: M) -> Result + where + M: Indexable, + M::Type: Eq + Hash, + { + Ok(Self::from_value_map(ValueMap::::from_values(values)?)) + } + + fn from_value_map(value_map: ValueMap) -> Self { + let keys = MutablePrimitiveArray::::new(); + let data_type = + DataType::Dictionary(K::KEY_TYPE, Box::new(value_map.data_type().clone()), false); + Self { + data_type, + map: value_map, + keys, + } + } + + /// Creates an empty [`MutableDictionaryArray`] retaining the same dictionary as the current + /// mutable dictionary array, but with no data. This may come useful when serializing the + /// array into multiple chunks, where there's a requirement that the dictionary is the same. + /// No copying is performed, the value map is moved over to the new array. + pub fn into_empty(self) -> Self { + Self::from_value_map(self.map) + } + + /// Same as `into_empty` but clones the inner value map instead of taking full ownership. + pub fn to_empty(&self) -> Self + where + M: Clone, + { + Self::from_value_map(self.map.clone()) + } + + /// pushes a null value + pub fn push_null(&mut self) { + self.keys.push(None) + } + + /// returns a reference to the inner values. + pub fn values(&self) -> &M { + self.map.values() + } + + /// converts itself into [`Arc`] + pub fn into_arc(self) -> Arc { + let a: DictionaryArray = self.into(); + Arc::new(a) + } + + /// converts itself into [`Box`] + pub fn into_box(self) -> Box { + let a: DictionaryArray = self.into(); + Box::new(a) + } + + /// Reserves `additional` slots. + pub fn reserve(&mut self, additional: usize) { + self.keys.reserve(additional); + } + + /// Shrinks the capacity of the [`MutableDictionaryArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.map.shrink_to_fit(); + self.keys.shrink_to_fit(); + } + + /// Returns the dictionary keys + pub fn keys(&self) -> &MutablePrimitiveArray { + &self.keys + } + + fn take_into(&mut self) -> DictionaryArray { + DictionaryArray::::try_new( + self.data_type.clone(), + std::mem::take(&mut self.keys).into(), + self.map.take_into(), + ) + .unwrap() + } +} + +impl MutableArray for MutableDictionaryArray { + fn len(&self) -> usize { + self.keys.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.keys.validity() + } + + fn as_box(&mut self) -> Box { + Box::new(self.take_into()) + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.take_into()) + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + self.keys.push(None) + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl TryExtend> for MutableDictionaryArray +where + K: DictionaryKey, + M: MutableArray + Indexable + TryExtend>, + T: AsIndexed, + M::Type: Eq + Hash, +{ + fn try_extend>>(&mut self, iter: II) -> Result<()> { + for value in iter { + if let Some(value) = value { + let key = self + .map + .try_push_valid(value, |arr, v| arr.try_extend(std::iter::once(Some(v))))?; + self.keys.try_push(Some(key))?; + } else { + self.push_null(); + } + } + Ok(()) + } +} + +impl TryPush> for MutableDictionaryArray +where + K: DictionaryKey, + M: MutableArray + Indexable + TryPush>, + T: AsIndexed, + M::Type: Eq + Hash, +{ + fn try_push(&mut self, item: Option) -> Result<()> { + if let Some(value) = item { + let key = self + .map + .try_push_valid(value, |arr, v| 
arr.try_push(Some(v)))?; + self.keys.try_push(Some(key))?; + } else { + self.push_null(); + } + Ok(()) + } +} diff --git a/crates/nano-arrow/src/array/dictionary/typed_iterator.rs b/crates/nano-arrow/src/array/dictionary/typed_iterator.rs new file mode 100644 index 000000000000..fd68942051aa --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/typed_iterator.rs @@ -0,0 +1,110 @@ +use super::DictionaryKey; +use crate::array::{Array, PrimitiveArray, Utf8Array}; +use crate::error::{Error, Result}; +use crate::trusted_len::TrustedLen; +use crate::types::Offset; + +pub trait DictValue { + type IterValue<'this> + where + Self: 'this; + + /// # Safety + /// Will not do any bound checks but must check validity. + unsafe fn get_unchecked(&self, item: usize) -> Self::IterValue<'_>; + + /// Take a [`dyn Array`] an try to downcast it to the type of `DictValue`. + fn downcast_values(array: &dyn Array) -> Result<&Self> + where + Self: Sized; +} + +impl DictValue for Utf8Array { + type IterValue<'a> = &'a str; + + unsafe fn get_unchecked(&self, item: usize) -> Self::IterValue<'_> { + self.value_unchecked(item) + } + + fn downcast_values(array: &dyn Array) -> Result<&Self> + where + Self: Sized, + { + array + .as_any() + .downcast_ref::() + .ok_or(Error::InvalidArgumentError( + "could not convert array to dictionary value".into(), + )) + .map(|arr| { + assert_eq!( + arr.null_count(), + 0, + "null values in values not supported in iteration" + ); + arr + }) + } +} + +/// Iterator of values of an `ListArray`. +pub struct DictionaryValuesIterTyped<'a, K: DictionaryKey, V: DictValue> { + keys: &'a PrimitiveArray, + values: &'a V, + index: usize, + end: usize, +} + +impl<'a, K: DictionaryKey, V: DictValue> DictionaryValuesIterTyped<'a, K, V> { + pub(super) unsafe fn new(keys: &'a PrimitiveArray, values: &'a V) -> Self { + Self { + keys, + values, + index: 0, + end: keys.len(), + } + } +} + +impl<'a, K: DictionaryKey, V: DictValue> Iterator for DictionaryValuesIterTyped<'a, K, V> { + type Item = V::IterValue<'a>; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + unsafe { + let key = self.keys.value_unchecked(old); + let idx = key.as_usize(); + Some(self.values.get_unchecked(idx)) + } + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } +} + +unsafe impl<'a, K: DictionaryKey, V: DictValue> TrustedLen for DictionaryValuesIterTyped<'a, K, V> {} + +impl<'a, K: DictionaryKey, V: DictValue> DoubleEndedIterator + for DictionaryValuesIterTyped<'a, K, V> +{ + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + unsafe { + let key = self.keys.value_unchecked(self.end); + let idx = key.as_usize(); + Some(self.values.get_unchecked(idx)) + } + } + } +} diff --git a/crates/nano-arrow/src/array/dictionary/value_map.rs b/crates/nano-arrow/src/array/dictionary/value_map.rs new file mode 100644 index 000000000000..5a12534766bd --- /dev/null +++ b/crates/nano-arrow/src/array/dictionary/value_map.rs @@ -0,0 +1,171 @@ +use std::borrow::Borrow; +use std::fmt::{self, Debug}; +use std::hash::{BuildHasher, BuildHasherDefault, Hash, Hasher}; + +use hashbrown::hash_map::RawEntryMut; +use hashbrown::HashMap; + +use super::DictionaryKey; +use crate::array::indexable::{AsIndexed, Indexable}; +use crate::array::{Array, MutableArray}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +/// Hasher for 
pre-hashed values; similar to `hash_hasher` but with native endianness. +/// +/// We know that we'll only use it for `u64` values, so we can avoid endian conversion. +/// +/// Invariant: hash of a u64 value is always equal to itself. +#[derive(Copy, Clone, Default)] +pub struct PassthroughHasher(u64); + +impl Hasher for PassthroughHasher { + #[inline] + fn write_u64(&mut self, value: u64) { + self.0 = value; + } + + fn write(&mut self, _: &[u8]) { + unreachable!(); + } + + #[inline] + fn finish(&self) -> u64 { + self.0 + } +} + +#[derive(Clone)] +pub struct Hashed { + hash: u64, + key: K, +} + +#[inline] +fn ahash_hash(value: &T) -> u64 { + let mut hasher = BuildHasherDefault::::default().build_hasher(); + value.hash(&mut hasher); + hasher.finish() +} + +impl Hash for Hashed { + #[inline] + fn hash(&self, state: &mut H) { + self.hash.hash(state) + } +} + +#[derive(Clone)] +pub struct ValueMap { + pub values: M, + pub map: HashMap, (), BuildHasherDefault>, // NB: *only* use insert_hashed_nocheck() and no other hashmap API +} + +impl ValueMap { + pub fn try_empty(values: M) -> Result { + if !values.is_empty() { + return Err(Error::InvalidArgumentError( + "initializing value map with non-empty values array".into(), + )); + } + Ok(Self { + values, + map: HashMap::default(), + }) + } + + pub fn from_values(values: M) -> Result + where + M: Indexable, + M::Type: Eq + Hash, + { + let mut map = HashMap::, _, _>::with_capacity_and_hasher( + values.len(), + BuildHasherDefault::::default(), + ); + for index in 0..values.len() { + let key = K::try_from(index).map_err(|_| Error::Overflow)?; + // safety: we only iterate within bounds + let value = unsafe { values.value_unchecked_at(index) }; + let hash = ahash_hash(value.borrow()); + match map.raw_entry_mut().from_hash(hash, |item| { + // safety: invariant of the struct, it's always in bounds since we maintain it + let stored_value = unsafe { values.value_unchecked_at(item.key.as_usize()) }; + stored_value.borrow() == value.borrow() + }) { + RawEntryMut::Occupied(_) => { + return Err(Error::InvalidArgumentError( + "duplicate value in dictionary values array".into(), + )) + }, + RawEntryMut::Vacant(entry) => { + // NB: don't use .insert() here! + entry.insert_hashed_nocheck(hash, Hashed { hash, key }, ()); + }, + } + } + Ok(Self { values, map }) + } + + pub fn data_type(&self) -> &DataType { + self.values.data_type() + } + + pub fn into_values(self) -> M { + self.values + } + + pub fn take_into(&mut self) -> Box { + let arr = self.values.as_box(); + self.map.clear(); + arr + } + + #[inline] + pub fn values(&self) -> &M { + &self.values + } + + /// Try to insert a value and return its index (it may or may not get inserted). + pub fn try_push_valid( + &mut self, + value: V, + mut push: impl FnMut(&mut M, V) -> Result<()>, + ) -> Result + where + M: Indexable, + V: AsIndexed, + M::Type: Eq + Hash, + { + let hash = ahash_hash(value.as_indexed()); + Ok( + match self.map.raw_entry_mut().from_hash(hash, |item| { + // safety: we've already checked (the inverse) when we pushed it, so it should be ok? 
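+ // (every key stored in the map was created from a valid index into `values` via
+ // `K::try_from(index)`, so converting it back to `usize` is in bounds for the
+ // `value_unchecked_at` call below)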
+ let index = unsafe { item.key.as_usize() }; + // safety: invariant of the struct, it's always in bounds since we maintain it + let stored_value = unsafe { self.values.value_unchecked_at(index) }; + stored_value.borrow() == value.as_indexed() + }) { + RawEntryMut::Occupied(entry) => entry.key().key, + RawEntryMut::Vacant(entry) => { + let index = self.values.len(); + let key = K::try_from(index).map_err(|_| Error::Overflow)?; + entry.insert_hashed_nocheck(hash, Hashed { hash, key }, ()); // NB: don't use .insert() here! + push(&mut self.values, value)?; + debug_assert_eq!(self.values.len(), index + 1); + key + }, + }, + ) + } + + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + } +} + +impl Debug for ValueMap { + fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { + self.values.fmt(f) + } +} diff --git a/crates/nano-arrow/src/array/equal/binary.rs b/crates/nano-arrow/src/array/equal/binary.rs new file mode 100644 index 000000000000..bed8588efb59 --- /dev/null +++ b/crates/nano-arrow/src/array/equal/binary.rs @@ -0,0 +1,6 @@ +use crate::array::BinaryArray; +use crate::offset::Offset; + +pub(super) fn equal(lhs: &BinaryArray, rhs: &BinaryArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/boolean.rs b/crates/nano-arrow/src/array/equal/boolean.rs new file mode 100644 index 000000000000..d9c6af9b0276 --- /dev/null +++ b/crates/nano-arrow/src/array/equal/boolean.rs @@ -0,0 +1,5 @@ +use crate::array::BooleanArray; + +pub(super) fn equal(lhs: &BooleanArray, rhs: &BooleanArray) -> bool { + lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/dictionary.rs b/crates/nano-arrow/src/array/equal/dictionary.rs new file mode 100644 index 000000000000..d65634095fb3 --- /dev/null +++ b/crates/nano-arrow/src/array/equal/dictionary.rs @@ -0,0 +1,14 @@ +use crate::array::{DictionaryArray, DictionaryKey}; + +pub(super) fn equal(lhs: &DictionaryArray, rhs: &DictionaryArray) -> bool { + if !(lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len()) { + return false; + }; + + // if x is not valid and y is but its child is not, the slots are equal. 
+ lhs.iter().zip(rhs.iter()).all(|(x, y)| match (&x, &y) { + (None, Some(y)) => !y.is_valid(), + (Some(x), None) => !x.is_valid(), + _ => x == y, + }) +} diff --git a/crates/nano-arrow/src/array/equal/fixed_size_binary.rs b/crates/nano-arrow/src/array/equal/fixed_size_binary.rs new file mode 100644 index 000000000000..883d5739778b --- /dev/null +++ b/crates/nano-arrow/src/array/equal/fixed_size_binary.rs @@ -0,0 +1,5 @@ +use crate::array::{Array, FixedSizeBinaryArray}; + +pub(super) fn equal(lhs: &FixedSizeBinaryArray, rhs: &FixedSizeBinaryArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/fixed_size_list.rs b/crates/nano-arrow/src/array/equal/fixed_size_list.rs new file mode 100644 index 000000000000..aaf77910013f --- /dev/null +++ b/crates/nano-arrow/src/array/equal/fixed_size_list.rs @@ -0,0 +1,5 @@ +use crate::array::{Array, FixedSizeListArray}; + +pub(super) fn equal(lhs: &FixedSizeListArray, rhs: &FixedSizeListArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/list.rs b/crates/nano-arrow/src/array/equal/list.rs new file mode 100644 index 000000000000..26faa1598faf --- /dev/null +++ b/crates/nano-arrow/src/array/equal/list.rs @@ -0,0 +1,6 @@ +use crate::array::{Array, ListArray}; +use crate::offset::Offset; + +pub(super) fn equal(lhs: &ListArray, rhs: &ListArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/map.rs b/crates/nano-arrow/src/array/equal/map.rs new file mode 100644 index 000000000000..e150fb4a4b41 --- /dev/null +++ b/crates/nano-arrow/src/array/equal/map.rs @@ -0,0 +1,5 @@ +use crate::array::{Array, MapArray}; + +pub(super) fn equal(lhs: &MapArray, rhs: &MapArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/mod.rs b/crates/nano-arrow/src/array/equal/mod.rs new file mode 100644 index 000000000000..91fd0c2f464f --- /dev/null +++ b/crates/nano-arrow/src/array/equal/mod.rs @@ -0,0 +1,287 @@ +use super::*; +use crate::offset::Offset; +use crate::types::NativeType; + +mod binary; +mod boolean; +mod dictionary; +mod fixed_size_binary; +mod fixed_size_list; +mod list; +mod map; +mod null; +mod primitive; +mod struct_; +mod union; +mod utf8; + +impl PartialEq for dyn Array + '_ { + fn eq(&self, that: &dyn Array) -> bool { + equal(self, that) + } +} + +impl PartialEq for std::sync::Arc { + fn eq(&self, that: &dyn Array) -> bool { + equal(&**self, that) + } +} + +impl PartialEq for Box { + fn eq(&self, that: &dyn Array) -> bool { + equal(&**self, that) + } +} + +impl PartialEq for NullArray { + fn eq(&self, other: &Self) -> bool { + null::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for NullArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq<&dyn Array> for PrimitiveArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for &dyn Array { + fn eq(&self, other: &PrimitiveArray) -> bool { + equal(*self, other) + } +} + +impl PartialEq> for PrimitiveArray { + fn eq(&self, other: &Self) -> bool { + primitive::equal::(self, other) + } +} + +impl PartialEq for BooleanArray { + fn eq(&self, other: &Self) -> bool { + equal(self, other) + } +} + +impl PartialEq<&dyn 
Array> for BooleanArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for Utf8Array { + fn eq(&self, other: &Self) -> bool { + utf8::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for Utf8Array { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for &dyn Array { + fn eq(&self, other: &Utf8Array) -> bool { + equal(*self, other) + } +} + +impl PartialEq> for BinaryArray { + fn eq(&self, other: &Self) -> bool { + binary::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for BinaryArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for &dyn Array { + fn eq(&self, other: &BinaryArray) -> bool { + equal(*self, other) + } +} + +impl PartialEq for FixedSizeBinaryArray { + fn eq(&self, other: &Self) -> bool { + fixed_size_binary::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for FixedSizeBinaryArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for ListArray { + fn eq(&self, other: &Self) -> bool { + list::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for ListArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq for FixedSizeListArray { + fn eq(&self, other: &Self) -> bool { + fixed_size_list::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for FixedSizeListArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq for StructArray { + fn eq(&self, other: &Self) -> bool { + struct_::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for StructArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq> for DictionaryArray { + fn eq(&self, other: &Self) -> bool { + dictionary::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for DictionaryArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq for UnionArray { + fn eq(&self, other: &Self) -> bool { + union::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for UnionArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +impl PartialEq for MapArray { + fn eq(&self, other: &Self) -> bool { + map::equal(self, other) + } +} + +impl PartialEq<&dyn Array> for MapArray { + fn eq(&self, other: &&dyn Array) -> bool { + equal(self, *other) + } +} + +/// Logically compares two [`Array`]s. 
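+/// (Nullness is compared logically: a null slot only equals another logically-null slot, and the
+/// bytes behind null slots are ignored.)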
+/// Two arrays are logically equal if and only if: +/// * their data types are equal +/// * each of their items are equal +pub fn equal(lhs: &dyn Array, rhs: &dyn Array) -> bool { + if lhs.data_type() != rhs.data_type() { + return false; + } + + use crate::datatypes::PhysicalType::*; + match lhs.data_type().to_physical_type() { + Null => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + null::equal(lhs, rhs) + }, + Boolean => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + boolean::equal(lhs, rhs) + }, + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + primitive::equal::<$T>(lhs, rhs) + }), + Utf8 => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + utf8::equal::(lhs, rhs) + }, + LargeUtf8 => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + utf8::equal::(lhs, rhs) + }, + Binary => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + binary::equal::(lhs, rhs) + }, + LargeBinary => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + binary::equal::(lhs, rhs) + }, + List => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + list::equal::(lhs, rhs) + }, + LargeList => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + list::equal::(lhs, rhs) + }, + Struct => { + let lhs = lhs.as_any().downcast_ref::().unwrap(); + let rhs = rhs.as_any().downcast_ref::().unwrap(); + struct_::equal(lhs, rhs) + }, + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + dictionary::equal::<$T>(lhs, rhs) + }) + }, + FixedSizeBinary => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + fixed_size_binary::equal(lhs, rhs) + }, + FixedSizeList => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + fixed_size_list::equal(lhs, rhs) + }, + Union => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + union::equal(lhs, rhs) + }, + Map => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + map::equal(lhs, rhs) + }, + } +} diff --git a/crates/nano-arrow/src/array/equal/null.rs b/crates/nano-arrow/src/array/equal/null.rs new file mode 100644 index 000000000000..11ad6cc133bb --- /dev/null +++ b/crates/nano-arrow/src/array/equal/null.rs @@ -0,0 +1,6 @@ +use crate::array::{Array, NullArray}; + +#[inline] +pub(super) fn equal(lhs: &NullArray, rhs: &NullArray) -> bool { + lhs.len() == rhs.len() +} diff --git a/crates/nano-arrow/src/array/equal/primitive.rs b/crates/nano-arrow/src/array/equal/primitive.rs new file mode 100644 index 000000000000..dc90bb15da5e --- /dev/null +++ b/crates/nano-arrow/src/array/equal/primitive.rs @@ -0,0 +1,6 @@ +use crate::array::PrimitiveArray; +use crate::types::NativeType; + +pub(super) fn equal(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff 
--git a/crates/nano-arrow/src/array/equal/struct_.rs b/crates/nano-arrow/src/array/equal/struct_.rs new file mode 100644 index 000000000000..a1741e36368c --- /dev/null +++ b/crates/nano-arrow/src/array/equal/struct_.rs @@ -0,0 +1,54 @@ +use crate::array::{Array, StructArray}; + +pub(super) fn equal(lhs: &StructArray, rhs: &StructArray) -> bool { + lhs.data_type() == rhs.data_type() + && lhs.len() == rhs.len() + && match (lhs.validity(), rhs.validity()) { + (None, None) => lhs.values().iter().eq(rhs.values().iter()), + (Some(l_validity), Some(r_validity)) => lhs + .values() + .iter() + .zip(rhs.values().iter()) + .all(|(lhs, rhs)| { + l_validity.iter().zip(r_validity.iter()).enumerate().all( + |(i, (lhs_is_valid, rhs_is_valid))| { + if lhs_is_valid && rhs_is_valid { + lhs.sliced(i, 1) == rhs.sliced(i, 1) + } else { + lhs_is_valid == rhs_is_valid + } + }, + ) + }), + (Some(l_validity), None) => { + lhs.values() + .iter() + .zip(rhs.values().iter()) + .all(|(lhs, rhs)| { + l_validity.iter().enumerate().all(|(i, lhs_is_valid)| { + if lhs_is_valid { + lhs.sliced(i, 1) == rhs.sliced(i, 1) + } else { + // rhs is always valid => different + false + } + }) + }) + }, + (None, Some(r_validity)) => { + lhs.values() + .iter() + .zip(rhs.values().iter()) + .all(|(lhs, rhs)| { + r_validity.iter().enumerate().all(|(i, rhs_is_valid)| { + if rhs_is_valid { + lhs.sliced(i, 1) == rhs.sliced(i, 1) + } else { + // lhs is always valid => different + false + } + }) + }) + }, + } +} diff --git a/crates/nano-arrow/src/array/equal/union.rs b/crates/nano-arrow/src/array/equal/union.rs new file mode 100644 index 000000000000..51b9d960feac --- /dev/null +++ b/crates/nano-arrow/src/array/equal/union.rs @@ -0,0 +1,5 @@ +use crate::array::{Array, UnionArray}; + +pub(super) fn equal(lhs: &UnionArray, rhs: &UnionArray) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/equal/utf8.rs b/crates/nano-arrow/src/array/equal/utf8.rs new file mode 100644 index 000000000000..1327221ca331 --- /dev/null +++ b/crates/nano-arrow/src/array/equal/utf8.rs @@ -0,0 +1,6 @@ +use crate::array::Utf8Array; +use crate::offset::Offset; + +pub(super) fn equal(lhs: &Utf8Array, rhs: &Utf8Array) -> bool { + lhs.data_type() == rhs.data_type() && lhs.len() == rhs.len() && lhs.iter().eq(rhs.iter()) +} diff --git a/crates/nano-arrow/src/array/ffi.rs b/crates/nano-arrow/src/array/ffi.rs new file mode 100644 index 000000000000..0e9629d4fdf0 --- /dev/null +++ b/crates/nano-arrow/src/array/ffi.rs @@ -0,0 +1,86 @@ +use crate::array::*; +use crate::datatypes::PhysicalType; +use crate::error::Result; +use crate::ffi; + +/// Trait describing how a struct presents itself to the +/// [C data interface](https://arrow.apache.org/docs/format/CDataInterface.html) (FFI). +/// # Safety +/// Implementing this trait incorrect will lead to UB +pub(crate) unsafe trait ToFfi { + /// The pointers to the buffers. + fn buffers(&self) -> Vec>; + + /// The children + fn children(&self) -> Vec> { + vec![] + } + + /// The offset + fn offset(&self) -> Option; + + /// return a partial clone of self with an offset. + fn to_ffi_aligned(&self) -> Self; +} + +/// Trait describing how a struct imports into itself from the +/// [C data interface](https://arrow.apache.org/docs/format/CDataInterface.html) (FFI). +pub(crate) trait FromFfi: Sized { + /// Convert itself from FFI. 
+ /// # Safety + /// This function is intrinsically `unsafe` as it requires the FFI to be made according + /// to the [C data interface](https://arrow.apache.org/docs/format/CDataInterface.html) + unsafe fn try_from_ffi(array: T) -> Result; +} + +macro_rules! ffi_dyn { + ($array:expr, $ty:ty) => {{ + let array = $array.as_any().downcast_ref::<$ty>().unwrap(); + ( + array.offset().unwrap(), + array.buffers(), + array.children(), + None, + ) + }}; +} + +type BuffersChildren = ( + usize, + Vec>, + Vec>, + Option>, +); + +pub fn offset_buffers_children_dictionary(array: &dyn Array) -> BuffersChildren { + use PhysicalType::*; + match array.data_type().to_physical_type() { + Null => ffi_dyn!(array, NullArray), + Boolean => ffi_dyn!(array, BooleanArray), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + ffi_dyn!(array, PrimitiveArray<$T>) + }), + Binary => ffi_dyn!(array, BinaryArray), + LargeBinary => ffi_dyn!(array, BinaryArray), + FixedSizeBinary => ffi_dyn!(array, FixedSizeBinaryArray), + Utf8 => ffi_dyn!(array, Utf8Array::), + LargeUtf8 => ffi_dyn!(array, Utf8Array::), + List => ffi_dyn!(array, ListArray::), + LargeList => ffi_dyn!(array, ListArray::), + FixedSizeList => ffi_dyn!(array, FixedSizeListArray), + Struct => ffi_dyn!(array, StructArray), + Union => ffi_dyn!(array, UnionArray), + Map => ffi_dyn!(array, MapArray), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + let array = array.as_any().downcast_ref::>().unwrap(); + ( + array.offset().unwrap(), + array.buffers(), + array.children(), + Some(array.values().clone()), + ) + }) + }, + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/data.rs b/crates/nano-arrow/src/array/fixed_size_binary/data.rs new file mode 100644 index 000000000000..6eb025d91623 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/data.rs @@ -0,0 +1,37 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{Arrow2Arrow, FixedSizeBinaryArray}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::DataType; + +impl Arrow2Arrow for FixedSizeBinaryArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .buffers(vec![self.values.clone().into()]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type: DataType = data.data_type().clone().into(); + let size = match data_type { + DataType::FixedSizeBinary(size) => size, + _ => unreachable!("must be FixedSizeBinary"), + }; + + let mut values: Buffer = data.buffers()[0].clone().into(); + values.slice(data.offset() * size, data.len() * size); + + Self { + size, + data_type, + values, + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/ffi.rs b/crates/nano-arrow/src/array/fixed_size_binary/ffi.rs new file mode 100644 index 000000000000..ee6e6a030df0 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/ffi.rs @@ -0,0 +1,56 @@ +use super::FixedSizeBinaryArray; +use crate::array::{FromFfi, ToFfi}; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; + +unsafe impl ToFfi for FixedSizeBinaryArray { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.values.as_ptr().cast::()), + ] + } + + fn offset(&self) -> Option { + let 
offset = self.values.offset() / self.size; + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.values.offset() / self.size; + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + size: self.size, + data_type: self.data_type.clone(), + validity, + values: self.values.clone(), + } + } +} + +impl FromFfi for FixedSizeBinaryArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let values = unsafe { array.buffer::(1) }?; + + Self::try_new(data_type, values, validity) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/fmt.rs b/crates/nano-arrow/src/array/fixed_size_binary/fmt.rs new file mode 100644 index 000000000000..c5f9e2dd3293 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/fmt.rs @@ -0,0 +1,20 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::write_vec; +use super::FixedSizeBinaryArray; + +pub fn write_value(array: &FixedSizeBinaryArray, index: usize, f: &mut W) -> Result { + let values = array.value(index); + let writer = |f: &mut W, index| write!(f, "{}", values[index]); + + write_vec(f, writer, None, values.len(), "None", false) +} + +impl Debug for FixedSizeBinaryArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, f); + + write!(f, "{:?}", self.data_type)?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/iterator.rs b/crates/nano-arrow/src/array/fixed_size_binary/iterator.rs new file mode 100644 index 000000000000..4c885c591943 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/iterator.rs @@ -0,0 +1,49 @@ +use super::{FixedSizeBinaryArray, MutableFixedSizeBinaryArray}; +use crate::array::MutableArray; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; + +impl<'a> IntoIterator for &'a FixedSizeBinaryArray { + type Item = Option<&'a [u8]>; + type IntoIter = ZipValidity<&'a [u8], std::slice::ChunksExact<'a, u8>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> FixedSizeBinaryArray { + /// constructs a new iterator + pub fn iter( + &'a self, + ) -> ZipValidity<&'a [u8], std::slice::ChunksExact<'a, u8>, BitmapIter<'a>> { + ZipValidity::new_with_validity(self.values_iter(), self.validity()) + } + + /// Returns iterator over the values of [`FixedSizeBinaryArray`] + pub fn values_iter(&'a self) -> std::slice::ChunksExact<'a, u8> { + self.values().chunks_exact(self.size) + } +} + +impl<'a> IntoIterator for &'a MutableFixedSizeBinaryArray { + type Item = Option<&'a [u8]>; + type IntoIter = ZipValidity<&'a [u8], std::slice::ChunksExact<'a, u8>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> MutableFixedSizeBinaryArray { + /// constructs a new iterator + pub fn iter( + &'a self, + ) -> ZipValidity<&'a [u8], std::slice::ChunksExact<'a, u8>, BitmapIter<'a>> { + ZipValidity::new(self.iter_values(), self.validity().map(|x| x.iter())) + } + + /// Returns iterator over the values of [`MutableFixedSizeBinaryArray`] + pub fn iter_values(&'a self) -> std::slice::ChunksExact<'a, u8> { + self.values().chunks_exact(self.size()) 
+ } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/mod.rs b/crates/nano-arrow/src/array/fixed_size_binary/mod.rs new file mode 100644 index 000000000000..f7f82c0a3ef0 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/mod.rs @@ -0,0 +1,286 @@ +use super::Array; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::Error; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +mod mutable; +pub use mutable::*; + +/// The Arrow's equivalent to an immutable `Vec>`. +/// Cloning and slicing this struct is `O(1)`. +#[derive(Clone)] +pub struct FixedSizeBinaryArray { + size: usize, // this is redundant with `data_type`, but useful to not have to deconstruct the data_type. + data_type: DataType, + values: Buffer, + validity: Option, +} + +impl FixedSizeBinaryArray { + /// Creates a new [`FixedSizeBinaryArray`]. + /// + /// # Errors + /// This function returns an error iff: + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::FixedSizeBinary`] + /// * The length of `values` is not a multiple of `size` in `data_type` + /// * the validity's length is not equal to `values.len() / size`. + pub fn try_new( + data_type: DataType, + values: Buffer, + validity: Option, + ) -> Result { + let size = Self::maybe_get_size(&data_type)?; + + if values.len() % size != 0 { + return Err(Error::oos(format!( + "values (of len {}) must be a multiple of size ({}) in FixedSizeBinaryArray.", + values.len(), + size + ))); + } + let len = values.len() / size; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != len) + { + return Err(Error::oos( + "validity mask length must be equal to the number of values divided by size", + )); + } + + Ok(Self { + size, + data_type, + values, + validity, + }) + } + + /// Creates a new [`FixedSizeBinaryArray`]. + /// # Panics + /// This function panics iff: + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::FixedSizeBinary`] + /// * The length of `values` is not a multiple of `size` in `data_type` + /// * the validity's length is not equal to `values.len() / size`. + pub fn new(data_type: DataType, values: Buffer, validity: Option) -> Self { + Self::try_new(data_type, values, validity).unwrap() + } + + /// Returns a new empty [`FixedSizeBinaryArray`]. + pub fn new_empty(data_type: DataType) -> Self { + Self::new(data_type, Buffer::new(), None) + } + + /// Returns a new null [`FixedSizeBinaryArray`]. + pub fn new_null(data_type: DataType, length: usize) -> Self { + let size = Self::maybe_get_size(&data_type).unwrap(); + Self::new( + data_type, + vec![0u8; length * size].into(), + Some(Bitmap::new_zeroed(length)), + ) + } +} + +// must use +impl FixedSizeBinaryArray { + /// Slices this [`FixedSizeBinaryArray`]. + /// # Implementation + /// This operation is `O(1)`. + /// # Panics + /// panics iff `offset + length > self.len()` + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`FixedSizeBinaryArray`]. + /// # Implementation + /// This operation is `O(1)`. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. 
+ pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.values + .slice_unchecked(offset * self.size, length * self.size); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); +} + +// accessors +impl FixedSizeBinaryArray { + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() / self.size + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Returns the values allocated on this [`FixedSizeBinaryArray`]. + pub fn values(&self) -> &Buffer { + &self.values + } + + /// Returns value at position `i`. + /// # Panic + /// Panics iff `i >= self.len()`. + #[inline] + pub fn value(&self, i: usize) -> &[u8] { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the element at index `i` as &str + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &[u8] { + // soundness: invariant of the function. + self.values + .get_unchecked(i * self.size..(i + 1) * self.size) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option<&[u8]> { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } + + /// Returns a new [`FixedSizeBinaryArray`] with a different logical type. + /// This is `O(1)`. + /// # Panics + /// Panics iff the data_type is not supported for the physical type. + #[inline] + pub fn to(self, data_type: DataType) -> Self { + match ( + data_type.to_logical_type(), + self.data_type().to_logical_type(), + ) { + (DataType::FixedSizeBinary(size_a), DataType::FixedSizeBinary(size_b)) + if size_a == size_b => {}, + _ => panic!("Wrong DataType"), + } + + Self { + size: self.size, + data_type, + values: self.values, + validity: self.validity, + } + } + + /// Returns the size + pub fn size(&self) -> usize { + self.size + } +} + +impl FixedSizeBinaryArray { + pub(crate) fn maybe_get_size(data_type: &DataType) -> Result { + match data_type.to_logical_type() { + DataType::FixedSizeBinary(size) => { + if *size == 0 { + return Err(Error::oos("FixedSizeBinaryArray expects a positive size")); + } + Ok(*size) + }, + _ => Err(Error::oos( + "FixedSizeBinaryArray expects DataType::FixedSizeBinary", + )), + } + } + + pub(crate) fn get_size(data_type: &DataType) -> usize { + Self::maybe_get_size(data_type).unwrap() + } +} + +impl Array for FixedSizeBinaryArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} + +impl FixedSizeBinaryArray { + /// Creates a [`FixedSizeBinaryArray`] from an fallible iterator of optional `[u8]`. + pub fn try_from_iter, I: IntoIterator>>( + iter: I, + size: usize, + ) -> Result { + MutableFixedSizeBinaryArray::try_from_iter(iter, size).map(|x| x.into()) + } + + /// Creates a [`FixedSizeBinaryArray`] from an iterator of optional `[u8]`. 
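+ /// For example (sketch): `FixedSizeBinaryArray::from_iter([Some([1u8, 2]), None], 2)` builds a
+ /// length-2 array whose second slot is null. Unlike [`Self::try_from_iter`], a length mismatch
+ /// panics instead of returning an error.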
+ pub fn from_iter, I: IntoIterator>>( + iter: I, + size: usize, + ) -> Self { + MutableFixedSizeBinaryArray::try_from_iter(iter, size) + .unwrap() + .into() + } + + /// Creates a [`FixedSizeBinaryArray`] from a slice of arrays of bytes + pub fn from_slice>(a: P) -> Self { + let values = a.as_ref().iter().flatten().copied().collect::>(); + Self::new(DataType::FixedSizeBinary(N), values.into(), None) + } + + /// Creates a new [`FixedSizeBinaryArray`] from a slice of optional `[u8]`. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. + pub fn from]>>(slice: P) -> Self { + MutableFixedSizeBinaryArray::from(slice).into() + } +} + +pub trait FixedSizeBinaryValues { + fn values(&self) -> &[u8]; + fn size(&self) -> usize; +} + +impl FixedSizeBinaryValues for FixedSizeBinaryArray { + #[inline] + fn values(&self) -> &[u8] { + &self.values + } + + #[inline] + fn size(&self) -> usize { + self.size + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_binary/mutable.rs b/crates/nano-arrow/src/array/fixed_size_binary/mutable.rs new file mode 100644 index 000000000000..f5a68facf681 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_binary/mutable.rs @@ -0,0 +1,321 @@ +use std::sync::Arc; + +use super::{FixedSizeBinaryArray, FixedSizeBinaryValues}; +use crate::array::physical_binary::extend_validity; +use crate::array::{Array, MutableArray, TryExtendFromSelf}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Error; + +/// The Arrow's equivalent to a mutable `Vec>`. +/// Converting a [`MutableFixedSizeBinaryArray`] into a [`FixedSizeBinaryArray`] is `O(1)`. +/// # Implementation +/// This struct does not allocate a validity until one is required (i.e. push a null to it). +#[derive(Debug, Clone)] +pub struct MutableFixedSizeBinaryArray { + data_type: DataType, + size: usize, + values: Vec, + validity: Option, +} + +impl From for FixedSizeBinaryArray { + fn from(other: MutableFixedSizeBinaryArray) -> Self { + FixedSizeBinaryArray::new( + other.data_type, + other.values.into(), + other.validity.map(|x| x.into()), + ) + } +} + +impl MutableFixedSizeBinaryArray { + /// Creates a new [`MutableFixedSizeBinaryArray`]. + /// + /// # Errors + /// This function returns an error iff: + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::FixedSizeBinary`] + /// * The length of `values` is not a multiple of `size` in `data_type` + /// * the validity's length is not equal to `values.len() / size`. + pub fn try_new( + data_type: DataType, + values: Vec, + validity: Option, + ) -> Result { + let size = FixedSizeBinaryArray::maybe_get_size(&data_type)?; + + if values.len() % size != 0 { + return Err(Error::oos(format!( + "values (of len {}) must be a multiple of size ({}) in FixedSizeBinaryArray.", + values.len(), + size + ))); + } + let len = values.len() / size; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != len) + { + return Err(Error::oos( + "validity mask length must be equal to the number of values divided by size", + )); + } + + Ok(Self { + size, + data_type, + values, + validity, + }) + } + + /// Creates a new empty [`MutableFixedSizeBinaryArray`]. + pub fn new(size: usize) -> Self { + Self::with_capacity(size, 0) + } + + /// Creates a new [`MutableFixedSizeBinaryArray`] with capacity for `capacity` entries. 
+ pub fn with_capacity(size: usize, capacity: usize) -> Self { + Self::try_new( + DataType::FixedSizeBinary(size), + Vec::::with_capacity(capacity * size), + None, + ) + .unwrap() + } + + /// Creates a new [`MutableFixedSizeBinaryArray`] from a slice of optional `[u8]`. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. + pub fn from]>>(slice: P) -> Self { + let values = slice + .as_ref() + .iter() + .copied() + .flat_map(|x| x.unwrap_or([0; N])) + .collect::>(); + let validity = slice + .as_ref() + .iter() + .map(|x| x.is_some()) + .collect::(); + Self::try_new(DataType::FixedSizeBinary(N), values, validity.into()).unwrap() + } + + /// tries to push a new entry to [`MutableFixedSizeBinaryArray`]. + /// # Error + /// Errors iff the size of `value` is not equal to its own size. + #[inline] + pub fn try_push>(&mut self, value: Option
) -> Result<(), Error> { + match value { + Some(bytes) => { + let bytes = bytes.as_ref(); + if self.size != bytes.len() { + return Err(Error::InvalidArgumentError( + "FixedSizeBinaryArray requires every item to be of its length".to_string(), + )); + } + self.values.extend_from_slice(bytes); + + match &mut self.validity { + Some(validity) => validity.push(true), + None => {}, + } + }, + None => { + self.values.resize(self.values.len() + self.size, 0); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + }, + } + Ok(()) + } + + /// pushes a new entry to [`MutableFixedSizeBinaryArray`]. + /// # Panics + /// Panics iff the size of `value` is not equal to its own size. + #[inline] + pub fn push>(&mut self, value: Option
) { + self.try_push(value).unwrap() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() / self.size + } + + /// Pop the last entry from [`MutableFixedSizeBinaryArray`]. + /// This function returns `None` iff this array is empty + pub fn pop(&mut self) -> Option> { + if self.values.len() < self.size { + return None; + } + let value_start = self.values.len() - self.size; + let value = self.values.split_off(value_start); + self.validity + .as_mut() + .map(|x| x.pop()?.then(|| ())) + .unwrap_or_else(|| Some(())) + .map(|_| value) + } + + /// Creates a new [`MutableFixedSizeBinaryArray`] from an iterator of values. + /// # Errors + /// Errors iff the size of any of the `value` is not equal to its own size. + pub fn try_from_iter, I: IntoIterator>>( + iter: I, + size: usize, + ) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut primitive = Self::with_capacity(size, lower); + for item in iterator { + primitive.try_push(item)? + } + Ok(primitive) + } + + /// returns the (fixed) size of the [`MutableFixedSizeBinaryArray`]. + #[inline] + pub fn size(&self) -> usize { + self.size + } + + /// Returns the capacity of this array + pub fn capacity(&self) -> usize { + self.values.capacity() / self.size + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + validity.set(self.len() - 1, false); + self.validity = Some(validity) + } + + /// Returns the element at index `i` as `&[u8]` + #[inline] + pub fn value(&self, i: usize) -> &[u8] { + &self.values[i * self.size..(i + 1) * self.size] + } + + /// Returns the element at index `i` as `&[u8]` + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &[u8] { + std::slice::from_raw_parts(self.values.as_ptr().add(i * self.size), self.size) + } + + /// Reserves `additional` slots. + pub fn reserve(&mut self, additional: usize) { + self.values.reserve(additional * self.size); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Shrinks the capacity of the [`MutableFixedSizeBinaryArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } +} + +/// Accessors +impl MutableFixedSizeBinaryArray { + /// Returns its values. + pub fn values(&self) -> &Vec { + &self.values + } + + /// Returns a mutable slice of values. 
+ pub fn values_mut_slice(&mut self) -> &mut [u8] { + self.values.as_mut_slice() + } +} + +impl MutableArray for MutableFixedSizeBinaryArray { + fn len(&self) -> usize { + self.values.len() / self.size + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(self.size), + std::mem::take(&mut self.values).into(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> Arc { + FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(self.size), + std::mem::take(&mut self.values).into(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + self.push::<&[u8]>(None); + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl FixedSizeBinaryValues for MutableFixedSizeBinaryArray { + #[inline] + fn values(&self) -> &[u8] { + &self.values + } + + #[inline] + fn size(&self) -> usize { + self.size + } +} + +impl PartialEq for MutableFixedSizeBinaryArray { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl TryExtendFromSelf for MutableFixedSizeBinaryArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<(), Error> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + let slice = other.values.as_slice(); + self.values.extend_from_slice(slice); + Ok(()) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/data.rs b/crates/nano-arrow/src/array/fixed_size_list/data.rs new file mode 100644 index 000000000000..966504bf3b6c --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/data.rs @@ -0,0 +1,36 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{from_data, to_data, Arrow2Arrow, FixedSizeListArray}; +use crate::bitmap::Bitmap; +use crate::datatypes::DataType; + +impl Arrow2Arrow for FixedSizeListArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .nulls(self.validity.as_ref().map(|b| b.clone().into())) + .child_data(vec![to_data(self.values.as_ref())]); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type: DataType = data.data_type().clone().into(); + let size = match data_type { + DataType::FixedSizeList(_, size) => size, + _ => unreachable!("must be FixedSizeList type"), + }; + + let mut values = from_data(&data.child_data()[0]); + values.slice(data.offset() * size, data.len() * size); + + Self { + size, + data_type, + values, + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/ffi.rs b/crates/nano-arrow/src/array/fixed_size_list/ffi.rs new file mode 100644 index 000000000000..237001809598 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/ffi.rs @@ -0,0 +1,39 @@ +use super::FixedSizeListArray; +use crate::array::ffi::{FromFfi, ToFfi}; +use crate::array::Array; +use crate::error::Result; +use crate::ffi; + +unsafe impl ToFfi for FixedSizeListArray { + fn buffers(&self) -> Vec> { + vec![self.validity.as_ref().map(|x| 
x.as_ptr())] + } + + fn children(&self) -> Vec> { + vec![self.values.clone()] + } + + fn offset(&self) -> Option { + Some( + self.validity + .as_ref() + .map(|bitmap| bitmap.offset()) + .unwrap_or_default(), + ) + } + + fn to_ffi_aligned(&self) -> Self { + self.clone() + } +} + +impl FromFfi for FixedSizeListArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let child = unsafe { array.child(0)? }; + let values = ffi::try_from(child)?; + + Self::try_new(data_type, values, validity) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/fmt.rs b/crates/nano-arrow/src/array/fixed_size_list/fmt.rs new file mode 100644 index 000000000000..ee7d86115a14 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/fmt.rs @@ -0,0 +1,24 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_vec}; +use super::FixedSizeListArray; + +pub fn write_value( + array: &FixedSizeListArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let values = array.value(index); + let writer = |f: &mut W, index| get_display(values.as_ref(), null)(f, index); + write_vec(f, writer, None, values.len(), null, false) +} + +impl Debug for FixedSizeListArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + write!(f, "FixedSizeListArray")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/iterator.rs b/crates/nano-arrow/src/array/fixed_size_list/iterator.rs new file mode 100644 index 000000000000..123658005adc --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/iterator.rs @@ -0,0 +1,43 @@ +use super::FixedSizeListArray; +use crate::array::{Array, ArrayAccessor, ArrayValuesIter}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; + +unsafe impl<'a> ArrayAccessor<'a> for FixedSizeListArray { + type Item = Box; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +/// Iterator of values of a [`FixedSizeListArray`]. 
+pub type FixedSizeListValuesIter<'a> = ArrayValuesIter<'a, FixedSizeListArray>; + +type ZipIter<'a> = ZipValidity, FixedSizeListValuesIter<'a>, BitmapIter<'a>>; + +impl<'a> IntoIterator for &'a FixedSizeListArray { + type Item = Option>; + type IntoIter = ZipIter<'a>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> FixedSizeListArray { + /// Returns an iterator of `Option>` + pub fn iter(&'a self) -> ZipIter<'a> { + ZipValidity::new_with_validity(FixedSizeListValuesIter::new(self), self.validity()) + } + + /// Returns an iterator of `Box` + pub fn values_iter(&'a self) -> FixedSizeListValuesIter<'a> { + FixedSizeListValuesIter::new(self) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/mod.rs b/crates/nano-arrow/src/array/fixed_size_list/mod.rs new file mode 100644 index 000000000000..25ee0db14874 --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/mod.rs @@ -0,0 +1,220 @@ +use super::{new_empty_array, new_null_array, Array}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +pub use iterator::*; +mod mutable; +pub use mutable::*; + +/// The Arrow's equivalent to an immutable `Vec>` where `T` is an Arrow type. +/// Cloning and slicing this struct is `O(1)`. +#[derive(Clone)] +pub struct FixedSizeListArray { + size: usize, // this is redundant with `data_type`, but useful to not have to deconstruct the data_type. + data_type: DataType, + values: Box, + validity: Option, +} + +impl FixedSizeListArray { + /// Creates a new [`FixedSizeListArray`]. + /// + /// # Errors + /// This function returns an error iff: + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::FixedSizeList`] + /// * The `data_type`'s inner field's data type is not equal to `values.data_type`. + /// * The length of `values` is not a multiple of `size` in `data_type` + /// * the validity's length is not equal to `values.len() / size`. + pub fn try_new( + data_type: DataType, + values: Box, + validity: Option, + ) -> Result { + let (child, size) = Self::try_child_and_size(&data_type)?; + + let child_data_type = &child.data_type; + let values_data_type = values.data_type(); + if child_data_type != values_data_type { + return Err(Error::oos( + format!("FixedSizeListArray's child's DataType must match. However, the expected DataType is {child_data_type:?} while it got {values_data_type:?}."), + )); + } + + if values.len() % size != 0 { + return Err(Error::oos(format!( + "values (of len {}) must be a multiple of size ({}) in FixedSizeListArray.", + values.len(), + size + ))); + } + let len = values.len() / size; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != len) + { + return Err(Error::oos( + "validity mask length must be equal to the number of values divided by size", + )); + } + + Ok(Self { + size, + data_type, + values, + validity, + }) + } + + /// Alias to `Self::try_new(...).unwrap()` + pub fn new(data_type: DataType, values: Box, validity: Option) -> Self { + Self::try_new(data_type, values, validity).unwrap() + } + + /// Returns the size (number of elements per slot) of this [`FixedSizeListArray`]. + pub const fn size(&self) -> usize { + self.size + } + + /// Returns a new empty [`FixedSizeListArray`]. 
+ pub fn new_empty(data_type: DataType) -> Self { + let values = new_empty_array(Self::get_child_and_size(&data_type).0.data_type().clone()); + Self::new(data_type, values, None) + } + + /// Returns a new null [`FixedSizeListArray`]. + pub fn new_null(data_type: DataType, length: usize) -> Self { + let (field, size) = Self::get_child_and_size(&data_type); + + let values = new_null_array(field.data_type().clone(), length * size); + Self::new(data_type, values, Some(Bitmap::new_zeroed(length))) + } +} + +// must use +impl FixedSizeListArray { + /// Slices this [`FixedSizeListArray`]. + /// # Implementation + /// This operation is `O(1)`. + /// # Panics + /// panics iff `offset + length > self.len()` + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`FixedSizeListArray`]. + /// # Implementation + /// This operation is `O(1)`. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.values + .slice_unchecked(offset * self.size, length * self.size); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); +} + +// accessors +impl FixedSizeListArray { + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() / self.size + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Returns the inner array. + pub fn values(&self) -> &Box { + &self.values + } + + /// Returns the `Vec` at position `i`. + /// # Panic: + /// panics iff `i >= self.len()` + #[inline] + pub fn value(&self, i: usize) -> Box { + self.values.sliced(i * self.size, self.size) + } + + /// Returns the `Vec` at position `i`. + /// # Safety + /// Caller must ensure that `i < self.len()` + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> Box { + self.values.sliced_unchecked(i * self.size, self.size) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option> { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } +} + +impl FixedSizeListArray { + pub(crate) fn try_child_and_size(data_type: &DataType) -> Result<(&Field, usize), Error> { + match data_type.to_logical_type() { + DataType::FixedSizeList(child, size) => { + if *size == 0 { + return Err(Error::oos("FixedSizeBinaryArray expects a positive size")); + } + Ok((child.as_ref(), *size)) + }, + _ => Err(Error::oos( + "FixedSizeListArray expects DataType::FixedSizeList", + )), + } + } + + pub(crate) fn get_child_and_size(data_type: &DataType) -> (&Field, usize) { + Self::try_child_and_size(data_type).unwrap() + } + + /// Returns a [`DataType`] consistent with [`FixedSizeListArray`]. 
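+ /// For example, `default_datatype(DataType::Int32, 3)` is
+ /// `DataType::FixedSizeList(Box::new(Field::new("item", DataType::Int32, true)), 3)`.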
+ pub fn default_datatype(data_type: DataType, size: usize) -> DataType { + let field = Box::new(Field::new("item", data_type, true)); + DataType::FixedSizeList(field, size) + } +} + +impl Array for FixedSizeListArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/fixed_size_list/mutable.rs b/crates/nano-arrow/src/array/fixed_size_list/mutable.rs new file mode 100644 index 000000000000..bef25a1cbf1f --- /dev/null +++ b/crates/nano-arrow/src/array/fixed_size_list/mutable.rs @@ -0,0 +1,256 @@ +use std::sync::Arc; + +use super::FixedSizeListArray; +use crate::array::physical_binary::extend_validity; +use crate::array::{Array, MutableArray, PushUnchecked, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::{Error, Result}; + +/// The mutable version of [`FixedSizeListArray`]. +#[derive(Debug, Clone)] +pub struct MutableFixedSizeListArray { + data_type: DataType, + size: usize, + values: M, + validity: Option, +} + +impl From> for FixedSizeListArray { + fn from(mut other: MutableFixedSizeListArray) -> Self { + FixedSizeListArray::new( + other.data_type, + other.values.as_box(), + other.validity.map(|x| x.into()), + ) + } +} + +impl MutableFixedSizeListArray { + /// Creates a new [`MutableFixedSizeListArray`] from a [`MutableArray`] and size. + pub fn new(values: M, size: usize) -> Self { + let data_type = FixedSizeListArray::default_datatype(values.data_type().clone(), size); + Self::new_from(values, data_type, size) + } + + /// Creates a new [`MutableFixedSizeListArray`] from a [`MutableArray`] and size. + pub fn new_with_field(values: M, name: &str, nullable: bool, size: usize) -> Self { + let data_type = DataType::FixedSizeList( + Box::new(Field::new(name, values.data_type().clone(), nullable)), + size, + ); + Self::new_from(values, data_type, size) + } + + /// Creates a new [`MutableFixedSizeListArray`] from a [`MutableArray`], [`DataType`] and size. + pub fn new_from(values: M, data_type: DataType, size: usize) -> Self { + assert_eq!(values.len(), 0); + match data_type { + DataType::FixedSizeList(..) => (), + _ => panic!("data type must be FixedSizeList (got {data_type:?})"), + }; + Self { + size, + data_type, + values, + validity: None, + } + } + + /// Returns the size (number of elements per slot) of this [`FixedSizeListArray`]. + pub const fn size(&self) -> usize { + self.size + } + + /// The length of this array + pub fn len(&self) -> usize { + self.values.len() / self.size + } + + /// The inner values + pub fn values(&self) -> &M { + &self.values + } + + /// The values as a mutable reference + pub fn mut_values(&mut self) -> &mut M { + &mut self.values + } + + fn init_validity(&mut self) { + let len = self.values.len() / self.size; + + let mut validity = MutableBitmap::new(); + validity.extend_constant(len, true); + validity.set(len - 1, false); + self.validity = Some(validity) + } + + #[inline] + /// Needs to be called when a valid value was extended to this array. + /// This is a relatively low level function, prefer `try_push` when you can. 
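+ /// Typical use (sketch): extend the inner array through [`Self::mut_values`] with exactly
+ /// `size()` new values, then call this; it returns [`Error::Overflow`] if the inner length is
+ /// no longer a multiple of `size()`.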
+ pub fn try_push_valid(&mut self) -> Result<()> { + if self.values.len() % self.size != 0 { + return Err(Error::Overflow); + }; + if let Some(validity) = &mut self.validity { + validity.push(true) + } + Ok(()) + } + + #[inline] + /// Needs to be called when a valid value was extended to this array. + /// This is a relatively low level function, prefer `try_push` when you can. + pub fn push_valid(&mut self) { + if let Some(validity) = &mut self.validity { + validity.push(true) + } + } + + #[inline] + fn push_null(&mut self) { + (0..self.size).for_each(|_| self.values.push_null()); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + } + + /// Reserves `additional` slots. + pub fn reserve(&mut self, additional: usize) { + self.values.reserve(additional); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Shrinks the capacity of the [`MutableFixedSizeListArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } +} + +impl MutableArray for MutableFixedSizeListArray { + fn len(&self) -> usize { + self.values.len() / self.size + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + FixedSizeListArray::new( + self.data_type.clone(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> Arc { + FixedSizeListArray::new( + self.data_type.clone(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + (0..self.size).for_each(|_| { + self.values.push_null(); + }); + if let Some(validity) = &mut self.validity { + validity.push(false) + } else { + self.init_validity() + } + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl TryExtend> for MutableFixedSizeListArray +where + M: MutableArray + TryExtend>, + I: IntoIterator>, +{ + #[inline] + fn try_extend>>(&mut self, iter: II) -> Result<()> { + for items in iter { + self.try_push(items)?; + } + Ok(()) + } +} + +impl TryPush> for MutableFixedSizeListArray +where + M: MutableArray + TryExtend>, + I: IntoIterator>, +{ + #[inline] + fn try_push(&mut self, item: Option) -> Result<()> { + if let Some(items) = item { + self.values.try_extend(items)?; + self.try_push_valid()?; + } else { + self.push_null(); + } + Ok(()) + } +} + +impl PushUnchecked> for MutableFixedSizeListArray +where + M: MutableArray + Extend>, + I: IntoIterator>, +{ + /// # Safety + /// The caller must ensure that the `I` iterates exactly over `size` + /// items, where `size` is the fixed size width. 
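+ /// Otherwise the inner array's length stops being a multiple of `size` and `len()` as well as
+ /// the slot boundaries silently go out of sync.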
+ #[inline] + unsafe fn push_unchecked(&mut self, item: Option) { + if let Some(items) = item { + self.values.extend(items); + self.push_valid(); + } else { + self.push_null(); + } + } +} + +impl TryExtendFromSelf for MutableFixedSizeListArray +where + M: MutableArray + TryExtendFromSelf, +{ + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + self.values.try_extend_from_self(&other.values) + } +} diff --git a/crates/nano-arrow/src/array/fmt.rs b/crates/nano-arrow/src/array/fmt.rs new file mode 100644 index 000000000000..ebc6937714cc --- /dev/null +++ b/crates/nano-arrow/src/array/fmt.rs @@ -0,0 +1,181 @@ +use std::fmt::{Result, Write}; + +use super::Array; +use crate::bitmap::Bitmap; + +/// Returns a function that writes the value of the element of `array` +/// at position `index` to a [`Write`], +/// writing `null` in the null slots. +pub fn get_value_display<'a, F: Write + 'a>( + array: &'a dyn Array, + null: &'static str, +) -> Box Result + 'a> { + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Null => Box::new(move |f, _| write!(f, "{null}")), + Boolean => Box::new(|f, index| { + super::boolean::fmt::write_value(array.as_any().downcast_ref().unwrap(), index, f) + }), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let writer = super::primitive::fmt::get_write_value::<$T, _>( + array.as_any().downcast_ref().unwrap(), + ); + Box::new(move |f, index| writer(f, index)) + }), + Binary => Box::new(|f, index| { + super::binary::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + f, + ) + }), + FixedSizeBinary => Box::new(|f, index| { + super::fixed_size_binary::fmt::write_value( + array.as_any().downcast_ref().unwrap(), + index, + f, + ) + }), + LargeBinary => Box::new(|f, index| { + super::binary::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + f, + ) + }), + Utf8 => Box::new(|f, index| { + super::utf8::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + f, + ) + }), + LargeUtf8 => Box::new(|f, index| { + super::utf8::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + f, + ) + }), + List => Box::new(move |f, index| { + super::list::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + null, + f, + ) + }), + FixedSizeList => Box::new(move |f, index| { + super::fixed_size_list::fmt::write_value( + array.as_any().downcast_ref().unwrap(), + index, + null, + f, + ) + }), + LargeList => Box::new(move |f, index| { + super::list::fmt::write_value::( + array.as_any().downcast_ref().unwrap(), + index, + null, + f, + ) + }), + Struct => Box::new(move |f, index| { + super::struct_::fmt::write_value(array.as_any().downcast_ref().unwrap(), index, null, f) + }), + Union => Box::new(move |f, index| { + super::union::fmt::write_value(array.as_any().downcast_ref().unwrap(), index, null, f) + }), + Map => Box::new(move |f, index| { + super::map::fmt::write_value(array.as_any().downcast_ref().unwrap(), index, null, f) + }), + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + Box::new(move |f, index| { + super::dictionary::fmt::write_value::<$T,_>(array.as_any().downcast_ref().unwrap(), index, null, f) + }) + }), + } +} + +/// Returns a function that writes the element of `array` +/// at position `index` to a [`Write`], writing `null` to the null slots. 
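// These writers back the `Debug` implementations of the concrete arrays:
// `get_value_display` picks a per-slot writer based on the physical type, and
// `get_display` (below) additionally consults the validity bitmap and writes
// the `null` token for null slots. A sketch of what that surfaces to a user,
// with arrow2-style constructors assumed and the exact output format being
// illustrative only:

use nano_arrow::array::Int32Array; // assumed alias for PrimitiveArray<i32>, as in arrow2

fn debug_output() {
    let array = Int32Array::from([Some(1), None, Some(3)]);
    // The Debug impl renders each slot through these writers,
    // producing something like `Int32[1, None, 3]`.
    println!("{array:?}");
}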
+pub fn get_display<'a, F: Write + 'a>( + array: &'a dyn Array, + null: &'static str, +) -> Box Result + 'a> { + let value_display = get_value_display(array, null); + Box::new(move |f, row| { + if array.is_null(row) { + f.write_str(null) + } else { + value_display(f, row) + } + }) +} + +pub fn write_vec( + f: &mut F, + d: D, + validity: Option<&Bitmap>, + len: usize, + null: &'static str, + new_lines: bool, +) -> Result +where + D: Fn(&mut F, usize) -> Result, + F: Write, +{ + f.write_char('[')?; + write_list(f, d, validity, len, null, new_lines)?; + f.write_char(']')?; + Ok(()) +} + +fn write_list( + f: &mut F, + d: D, + validity: Option<&Bitmap>, + len: usize, + null: &'static str, + new_lines: bool, +) -> Result +where + D: Fn(&mut F, usize) -> Result, + F: Write, +{ + for index in 0..len { + if index != 0 { + f.write_char(',')?; + f.write_char(if new_lines { '\n' } else { ' ' })?; + } + if let Some(val) = validity { + if val.get_bit(index) { + d(f, index) + } else { + write!(f, "{null}") + } + } else { + d(f, index) + }?; + } + Ok(()) +} + +pub fn write_map( + f: &mut F, + d: D, + validity: Option<&Bitmap>, + len: usize, + null: &'static str, + new_lines: bool, +) -> Result +where + D: Fn(&mut F, usize) -> Result, + F: Write, +{ + f.write_char('{')?; + write_list(f, d, validity, len, null, new_lines)?; + f.write_char('}')?; + Ok(()) +} diff --git a/crates/nano-arrow/src/array/growable/binary.rs b/crates/nano-arrow/src/array/growable/binary.rs new file mode 100644 index 000000000000..ca095f351446 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/binary.rs @@ -0,0 +1,102 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, extend_offset_values, ExtendNullBits}; +use super::Growable; +use crate::array::{Array, BinaryArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::offset::{Offset, Offsets}; + +/// Concrete [`Growable`] for the [`BinaryArray`]. +pub struct GrowableBinary<'a, O: Offset> { + arrays: Vec<&'a BinaryArray>, + data_type: DataType, + validity: MutableBitmap, + values: Vec, + offsets: Offsets, + extend_null_bits: Vec>, +} + +impl<'a, O: Offset> GrowableBinary<'a, O> { + /// Creates a new [`GrowableBinary`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: Vec<&'a BinaryArray>, mut use_validity: bool, capacity: usize) -> Self { + let data_type = arrays[0].data_type().clone(); + + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + Self { + arrays, + data_type, + values: Vec::with_capacity(0), + offsets: Offsets::with_capacity(capacity), + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> BinaryArray { + let data_type = self.data_type.clone(); + let validity = std::mem::take(&mut self.validity); + let offsets = std::mem::take(&mut self.offsets); + let values = std::mem::take(&mut self.values); + + BinaryArray::::new(data_type, offsets.into(), values.into(), validity.into()) + } +} + +impl<'a, O: Offset> Growable<'a> for GrowableBinary<'a, O> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let array = self.arrays[index]; + let offsets = array.offsets(); + let values = array.values(); + + self.offsets + .try_extend_from_slice(offsets, start, len) + .unwrap(); + + // values + extend_offset_values::(&mut self.values, offsets.buffer(), values, start, len); + } + + fn extend_validity(&mut self, additional: usize) { + self.offsets.extend_constant(additional); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.offsets.len() - 1 + } + + fn as_arc(&mut self) -> Arc { + self.to().arced() + } + + fn as_box(&mut self) -> Box { + self.to().boxed() + } +} + +impl<'a, O: Offset> From> for BinaryArray { + fn from(val: GrowableBinary<'a, O>) -> Self { + BinaryArray::::new( + val.data_type, + val.offsets.into(), + val.values.into(), + val.validity.into(), + ) + } +} diff --git a/crates/nano-arrow/src/array/growable/boolean.rs b/crates/nano-arrow/src/array/growable/boolean.rs new file mode 100644 index 000000000000..f69d66f1d696 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/boolean.rs @@ -0,0 +1,91 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::Growable; +use crate::array::{Array, BooleanArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; + +/// Concrete [`Growable`] for the [`BooleanArray`]. +pub struct GrowableBoolean<'a> { + arrays: Vec<&'a BooleanArray>, + data_type: DataType, + validity: MutableBitmap, + values: MutableBitmap, + extend_null_bits: Vec>, +} + +impl<'a> GrowableBoolean<'a> { + /// Creates a new [`GrowableBoolean`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: Vec<&'a BooleanArray>, mut use_validity: bool, capacity: usize) -> Self { + let data_type = arrays[0].data_type().clone(); + + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + Self { + arrays, + data_type, + values: MutableBitmap::with_capacity(capacity), + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> BooleanArray { + let validity = std::mem::take(&mut self.validity); + let values = std::mem::take(&mut self.values); + + BooleanArray::new(self.data_type.clone(), values.into(), validity.into()) + } +} + +impl<'a> Growable<'a> for GrowableBoolean<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let array = self.arrays[index]; + let values = array.values(); + + let (slice, offset, _) = values.as_slice(); + // safety: invariant offset + length <= slice.len() + unsafe { + self.values + .extend_from_slice_unchecked(slice, start + offset, len); + } + } + + fn extend_validity(&mut self, additional: usize) { + self.values.extend_constant(additional, false); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.values.len() + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a> From> for BooleanArray { + fn from(val: GrowableBoolean<'a>) -> Self { + BooleanArray::new(val.data_type, val.values.into(), val.validity.into()) + } +} diff --git a/crates/nano-arrow/src/array/growable/dictionary.rs b/crates/nano-arrow/src/array/growable/dictionary.rs new file mode 100644 index 000000000000..fa85cdad6f8e --- /dev/null +++ b/crates/nano-arrow/src/array/growable/dictionary.rs @@ -0,0 +1,157 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::{make_growable, Growable}; +use crate::array::{Array, DictionaryArray, DictionaryKey, PrimitiveArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; + +/// Concrete [`Growable`] for the [`DictionaryArray`]. +/// # Implementation +/// This growable does not perform collision checks and instead concatenates +/// the values of each [`DictionaryArray`] one after the other. +pub struct GrowableDictionary<'a, K: DictionaryKey> { + data_type: DataType, + keys_values: Vec<&'a [K]>, + key_values: Vec, + key_validity: MutableBitmap, + offsets: Vec, + values: Box, + extend_null_bits: Vec>, +} + +fn concatenate_values( + arrays_keys: &[&PrimitiveArray], + arrays_values: &[&dyn Array], + capacity: usize, +) -> (Box, Vec) { + let mut mutable = make_growable(arrays_values, false, capacity); + let mut offsets = Vec::with_capacity(arrays_keys.len() + 1); + offsets.push(0); + for (i, values) in arrays_values.iter().enumerate() { + mutable.extend(i, 0, values.len()); + offsets.push(offsets[i] + values.len()); + } + (mutable.as_box(), offsets) +} + +impl<'a, T: DictionaryKey> GrowableDictionary<'a, T> { + /// Creates a new [`GrowableDictionary`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: &[&'a DictionaryArray], mut use_validity: bool, capacity: usize) -> Self { + let data_type = arrays[0].data_type().clone(); + + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let arrays_keys = arrays.iter().map(|array| array.keys()).collect::>(); + let keys_values = arrays_keys + .iter() + .map(|array| array.values().as_slice()) + .collect::>(); + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(array.keys(), use_validity)) + .collect(); + + let arrays_values = arrays + .iter() + .map(|array| array.values().as_ref()) + .collect::>(); + + let (values, offsets) = concatenate_values(&arrays_keys, &arrays_values, capacity); + + Self { + data_type, + offsets, + values, + keys_values, + key_values: Vec::with_capacity(capacity), + key_validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + #[inline] + fn to(&mut self) -> DictionaryArray { + let validity = std::mem::take(&mut self.key_validity); + let key_values = std::mem::take(&mut self.key_values); + + #[cfg(debug_assertions)] + { + crate::array::specification::check_indexes(&key_values, self.values.len()).unwrap(); + } + let keys = + PrimitiveArray::::new(T::PRIMITIVE.into(), key_values.into(), validity.into()); + + // Safety - the invariant of this struct ensures that this is up-held + unsafe { + DictionaryArray::::try_new_unchecked( + self.data_type.clone(), + keys, + self.values.clone(), + ) + .unwrap() + } + } +} + +impl<'a, T: DictionaryKey> Growable<'a> for GrowableDictionary<'a, T> { + #[inline] + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.key_validity, start, len); + + let values = &self.keys_values[index][start..start + len]; + let offset = self.offsets[index]; + self.key_values.extend( + values + .iter() + // `.unwrap_or(0)` because this operation does not check for null values, which may contain any key. + .map(|x| { + let x: usize = offset + (*x).try_into().unwrap_or(0); + let x: T = match x.try_into() { + Ok(key) => key, + // todo: convert this to an error. + Err(_) => { + panic!("The maximum key is too small") + }, + }; + x + }), + ); + } + + #[inline] + fn len(&self) -> usize { + self.key_values.len() + } + + #[inline] + fn extend_validity(&mut self, additional: usize) { + self.key_values + .resize(self.key_values.len() + additional, T::default()); + self.key_validity.extend_constant(additional, false); + } + + #[inline] + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + #[inline] + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a, T: DictionaryKey> From> for DictionaryArray { + #[inline] + fn from(mut val: GrowableDictionary<'a, T>) -> Self { + val.to() + } +} diff --git a/crates/nano-arrow/src/array/growable/fixed_binary.rs b/crates/nano-arrow/src/array/growable/fixed_binary.rs new file mode 100644 index 000000000000..bc6b307f97f9 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/fixed_binary.rs @@ -0,0 +1,98 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::Growable; +use crate::array::{Array, FixedSizeBinaryArray}; +use crate::bitmap::MutableBitmap; + +/// Concrete [`Growable`] for the [`FixedSizeBinaryArray`]. +pub struct GrowableFixedSizeBinary<'a> { + arrays: Vec<&'a FixedSizeBinaryArray>, + validity: MutableBitmap, + values: Vec, + extend_null_bits: Vec>, + size: usize, // just a cache +} + +impl<'a> GrowableFixedSizeBinary<'a> { + /// Creates a new [`GrowableFixedSizeBinary`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. 
+ pub fn new( + arrays: Vec<&'a FixedSizeBinaryArray>, + mut use_validity: bool, + capacity: usize, + ) -> Self { + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. + if arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let size = FixedSizeBinaryArray::get_size(arrays[0].data_type()); + Self { + arrays, + values: Vec::with_capacity(0), + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + size, + } + } + + fn to(&mut self) -> FixedSizeBinaryArray { + let validity = std::mem::take(&mut self.validity); + let values = std::mem::take(&mut self.values); + + FixedSizeBinaryArray::new( + self.arrays[0].data_type().clone(), + values.into(), + validity.into(), + ) + } +} + +impl<'a> Growable<'a> for GrowableFixedSizeBinary<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let array = self.arrays[index]; + let values = array.values(); + + self.values + .extend_from_slice(&values[start * self.size..start * self.size + len * self.size]); + } + + fn extend_validity(&mut self, additional: usize) { + self.values + .extend_from_slice(&vec![0; self.size * additional]); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.values.len() / self.size + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a> From> for FixedSizeBinaryArray { + fn from(val: GrowableFixedSizeBinary<'a>) -> Self { + FixedSizeBinaryArray::new( + val.arrays[0].data_type().clone(), + val.values.into(), + val.validity.into(), + ) + } +} diff --git a/crates/nano-arrow/src/array/growable/fixed_size_list.rs b/crates/nano-arrow/src/array/growable/fixed_size_list.rs new file mode 100644 index 000000000000..cacad36bb4a7 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/fixed_size_list.rs @@ -0,0 +1,107 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::{make_growable, Growable}; +use crate::array::{Array, FixedSizeListArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; + +/// Concrete [`Growable`] for the [`FixedSizeListArray`]. +pub struct GrowableFixedSizeList<'a> { + arrays: Vec<&'a FixedSizeListArray>, + validity: MutableBitmap, + values: Box + 'a>, + extend_null_bits: Vec>, + size: usize, +} + +impl<'a> GrowableFixedSizeList<'a> { + /// Creates a new [`GrowableFixedSizeList`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new( + arrays: Vec<&'a FixedSizeListArray>, + mut use_validity: bool, + capacity: usize, + ) -> Self { + assert!(!arrays.is_empty()); + + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let size = + if let DataType::FixedSizeList(_, size) = &arrays[0].data_type().to_logical_type() { + *size + } else { + unreachable!("`GrowableFixedSizeList` expects `DataType::FixedSizeList`") + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let inner = arrays + .iter() + .map(|array| array.values().as_ref()) + .collect::>(); + let values = make_growable(&inner, use_validity, 0); + + Self { + arrays, + values, + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + size, + } + } + + fn to(&mut self) -> FixedSizeListArray { + let validity = std::mem::take(&mut self.validity); + let values = self.values.as_box(); + + FixedSizeListArray::new(self.arrays[0].data_type().clone(), values, validity.into()) + } +} + +impl<'a> Growable<'a> for GrowableFixedSizeList<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + self.values + .extend(index, start * self.size, len * self.size); + } + + fn extend_validity(&mut self, additional: usize) { + self.values.extend_validity(additional * self.size); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.values.len() / self.size + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a> From> for FixedSizeListArray { + fn from(val: GrowableFixedSizeList<'a>) -> Self { + let mut values = val.values; + let values = values.as_box(); + + Self::new( + val.arrays[0].data_type().clone(), + values, + val.validity.into(), + ) + } +} diff --git a/crates/nano-arrow/src/array/growable/list.rs b/crates/nano-arrow/src/array/growable/list.rs new file mode 100644 index 000000000000..9fdf9eb047bf --- /dev/null +++ b/crates/nano-arrow/src/array/growable/list.rs @@ -0,0 +1,112 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::{make_growable, Growable}; +use crate::array::{Array, ListArray}; +use crate::bitmap::MutableBitmap; +use crate::offset::{Offset, Offsets}; + +fn extend_offset_values( + growable: &mut GrowableList<'_, O>, + index: usize, + start: usize, + len: usize, +) { + let array = growable.arrays[index]; + let offsets = array.offsets(); + + growable + .offsets + .try_extend_from_slice(offsets, start, len) + .unwrap(); + + let end = offsets.buffer()[start + len].to_usize(); + let start = offsets.buffer()[start].to_usize(); + let len = end - start; + growable.values.extend(index, start, len); +} + +/// Concrete [`Growable`] for the [`ListArray`]. +pub struct GrowableList<'a, O: Offset> { + arrays: Vec<&'a ListArray>, + validity: MutableBitmap, + values: Box + 'a>, + offsets: Offsets, + extend_null_bits: Vec>, +} + +impl<'a, O: Offset> GrowableList<'a, O> { + /// Creates a new [`GrowableList`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: Vec<&'a ListArray>, mut use_validity: bool, capacity: usize) -> Self { + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let inner = arrays + .iter() + .map(|array| array.values().as_ref()) + .collect::>(); + let values = make_growable(&inner, use_validity, 0); + + Self { + arrays, + offsets: Offsets::with_capacity(capacity), + values, + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> ListArray { + let validity = std::mem::take(&mut self.validity); + let offsets = std::mem::take(&mut self.offsets); + let values = self.values.as_box(); + + ListArray::::new( + self.arrays[0].data_type().clone(), + offsets.into(), + values, + validity.into(), + ) + } +} + +impl<'a, O: Offset> Growable<'a> for GrowableList<'a, O> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + extend_offset_values::(self, index, start, len); + } + + fn extend_validity(&mut self, additional: usize) { + self.offsets.extend_constant(additional); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.offsets.len() - 1 + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a, O: Offset> From> for ListArray { + fn from(mut val: GrowableList<'a, O>) -> Self { + val.to() + } +} diff --git a/crates/nano-arrow/src/array/growable/map.rs b/crates/nano-arrow/src/array/growable/map.rs new file mode 100644 index 000000000000..62f9d4c5c53a --- /dev/null +++ b/crates/nano-arrow/src/array/growable/map.rs @@ -0,0 +1,107 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::{make_growable, Growable}; +use crate::array::{Array, MapArray}; +use crate::bitmap::MutableBitmap; +use crate::offset::Offsets; + +fn extend_offset_values(growable: &mut GrowableMap<'_>, index: usize, start: usize, len: usize) { + let array = growable.arrays[index]; + let offsets = array.offsets(); + + growable + .offsets + .try_extend_from_slice(offsets, start, len) + .unwrap(); + + let end = offsets.buffer()[start + len] as usize; + let start = offsets.buffer()[start] as usize; + let len = end - start; + growable.values.extend(index, start, len); +} + +/// Concrete [`Growable`] for the [`MapArray`]. +pub struct GrowableMap<'a> { + arrays: Vec<&'a MapArray>, + validity: MutableBitmap, + values: Box + 'a>, + offsets: Offsets, + extend_null_bits: Vec>, +} + +impl<'a> GrowableMap<'a> { + /// Creates a new [`GrowableMap`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: Vec<&'a MapArray>, mut use_validity: bool, capacity: usize) -> Self { + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let inner = arrays + .iter() + .map(|array| array.field().as_ref()) + .collect::>(); + let values = make_growable(&inner, use_validity, 0); + + Self { + arrays, + offsets: Offsets::with_capacity(capacity), + values, + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> MapArray { + let validity = std::mem::take(&mut self.validity); + let offsets = std::mem::take(&mut self.offsets); + let values = self.values.as_box(); + + MapArray::new( + self.arrays[0].data_type().clone(), + offsets.into(), + values, + validity.into(), + ) + } +} + +impl<'a> Growable<'a> for GrowableMap<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + extend_offset_values(self, index, start, len); + } + + fn extend_validity(&mut self, additional: usize) { + self.offsets.extend_constant(additional); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.offsets.len() - 1 + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a> From> for MapArray { + fn from(mut val: GrowableMap<'a>) -> Self { + val.to() + } +} diff --git a/crates/nano-arrow/src/array/growable/mod.rs b/crates/nano-arrow/src/array/growable/mod.rs new file mode 100644 index 000000000000..a3fe4b739451 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/mod.rs @@ -0,0 +1,149 @@ +//! Contains the trait [`Growable`] and corresponding concreate implementations, one per concrete array, +//! that offer the ability to create a new [`Array`] out of slices of existing [`Array`]s. + +use std::sync::Arc; + +use crate::array::*; +use crate::datatypes::*; + +mod binary; +pub use binary::GrowableBinary; +mod union; +pub use union::GrowableUnion; +mod boolean; +pub use boolean::GrowableBoolean; +mod fixed_binary; +pub use fixed_binary::GrowableFixedSizeBinary; +mod null; +pub use null::GrowableNull; +mod primitive; +pub use primitive::GrowablePrimitive; +mod list; +pub use list::GrowableList; +mod map; +pub use map::GrowableMap; +mod structure; +pub use structure::GrowableStruct; +mod fixed_size_list; +pub use fixed_size_list::GrowableFixedSizeList; +mod utf8; +pub use utf8::GrowableUtf8; +mod dictionary; +pub use dictionary::GrowableDictionary; + +mod utils; + +/// Describes a struct that can be extended from slices of other pre-existing [`Array`]s. +/// This is used in operations where a new array is built out of other arrays, such +/// as filter and concatenation. +pub trait Growable<'a> { + /// Extends this [`Growable`] with elements from the bounded [`Array`] at index `index` from + /// a slice starting at `start` and length `len`. + /// # Panic + /// This function panics if the range is out of bounds, i.e. if `start + len >= array.len()`. + fn extend(&mut self, index: usize, start: usize, len: usize); + + /// Extends this [`Growable`] with null elements, disregarding the bound arrays + fn extend_validity(&mut self, additional: usize); + + /// The current length of the [`Growable`]. + fn len(&self) -> usize; + + /// Converts this [`Growable`] to an [`Arc`], thereby finishing the mutation. + /// Self will be empty after such operation. 
+ fn as_arc(&mut self) -> Arc { + self.as_box().into() + } + + /// Converts this [`Growable`] to an [`Box`], thereby finishing the mutation. + /// Self will be empty after such operation + fn as_box(&mut self) -> Box; +} + +macro_rules! dyn_growable { + ($ty:ty, $arrays:expr, $use_validity:expr, $capacity:expr) => {{ + let arrays = $arrays + .iter() + .map(|array| array.as_any().downcast_ref().unwrap()) + .collect::>(); + Box::new(<$ty>::new(arrays, $use_validity, $capacity)) + }}; +} + +/// Creates a new [`Growable`] from an arbitrary number of [`Array`]s. +/// # Panics +/// This function panics iff +/// * the arrays do not have the same [`DataType`]. +/// * `arrays.is_empty()`. +pub fn make_growable<'a>( + arrays: &[&'a dyn Array], + use_validity: bool, + capacity: usize, +) -> Box + 'a> { + assert!(!arrays.is_empty()); + let data_type = arrays[0].data_type(); + + use PhysicalType::*; + match data_type.to_physical_type() { + Null => Box::new(null::GrowableNull::new(data_type.clone())), + Boolean => dyn_growable!(boolean::GrowableBoolean, arrays, use_validity, capacity), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + dyn_growable!(primitive::GrowablePrimitive::<$T>, arrays, use_validity, capacity) + }), + Utf8 => dyn_growable!(utf8::GrowableUtf8::, arrays, use_validity, capacity), + LargeUtf8 => dyn_growable!(utf8::GrowableUtf8::, arrays, use_validity, capacity), + Binary => dyn_growable!( + binary::GrowableBinary::, + arrays, + use_validity, + capacity + ), + LargeBinary => dyn_growable!( + binary::GrowableBinary::, + arrays, + use_validity, + capacity + ), + FixedSizeBinary => dyn_growable!( + fixed_binary::GrowableFixedSizeBinary, + arrays, + use_validity, + capacity + ), + List => dyn_growable!(list::GrowableList::, arrays, use_validity, capacity), + LargeList => dyn_growable!(list::GrowableList::, arrays, use_validity, capacity), + Struct => dyn_growable!(structure::GrowableStruct, arrays, use_validity, capacity), + FixedSizeList => dyn_growable!( + fixed_size_list::GrowableFixedSizeList, + arrays, + use_validity, + capacity + ), + Union => { + let arrays = arrays + .iter() + .map(|array| array.as_any().downcast_ref().unwrap()) + .collect::>(); + Box::new(union::GrowableUnion::new(arrays, capacity)) + }, + Map => dyn_growable!(map::GrowableMap, arrays, use_validity, capacity), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + let arrays = arrays + .iter() + .map(|array| { + array + .as_any() + .downcast_ref::>() + .unwrap() + }) + .collect::>(); + Box::new(dictionary::GrowableDictionary::<$T>::new( + &arrays, + use_validity, + capacity, + )) + }) + }, + } +} diff --git a/crates/nano-arrow/src/array/growable/null.rs b/crates/nano-arrow/src/array/growable/null.rs new file mode 100644 index 000000000000..44e1c2488b0f --- /dev/null +++ b/crates/nano-arrow/src/array/growable/null.rs @@ -0,0 +1,56 @@ +use std::sync::Arc; + +use super::Growable; +use crate::array::{Array, NullArray}; +use crate::datatypes::DataType; + +/// Concrete [`Growable`] for the [`NullArray`]. +pub struct GrowableNull { + data_type: DataType, + length: usize, +} + +impl Default for GrowableNull { + fn default() -> Self { + Self::new(DataType::Null) + } +} + +impl GrowableNull { + /// Creates a new [`GrowableNull`]. 
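// A sketch (not part of the diff) of driving `make_growable` from mod.rs above:
// slices of several arrays with the same DataType are copied into one new
// array. Crate and module paths (`nano_arrow::array::growable`) are assumed to
// mirror arrow2.

use nano_arrow::array::growable::{make_growable, Growable};
use nano_arrow::array::{Array, Int32Array};

fn concat_slices() -> Box<dyn Array> {
    let a = Int32Array::from_slice([1, 2, 3]);
    let b = Int32Array::from_slice([4, 5]);
    let arrays: Vec<&dyn Array> = vec![&a, &b];

    // `use_validity = false`: a validity bitmap is only materialized if an input has nulls.
    let mut growable = make_growable(&arrays, false, 3);
    growable.extend(0, 1, 2); // rows 1..3 of `a` -> 2, 3
    growable.extend(1, 0, 1); // row 0 of `b`     -> 4
    growable.as_box()         // Int32 array [2, 3, 4]
}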
+ pub fn new(data_type: DataType) -> Self { + Self { + data_type, + length: 0, + } + } +} + +impl<'a> Growable<'a> for GrowableNull { + fn extend(&mut self, _: usize, _: usize, len: usize) { + self.length += len; + } + + fn extend_validity(&mut self, additional: usize) { + self.length += additional; + } + + #[inline] + fn len(&self) -> usize { + self.length + } + + fn as_arc(&mut self) -> Arc { + Arc::new(NullArray::new(self.data_type.clone(), self.length)) + } + + fn as_box(&mut self) -> Box { + Box::new(NullArray::new(self.data_type.clone(), self.length)) + } +} + +impl From for NullArray { + fn from(val: GrowableNull) -> Self { + NullArray::new(val.data_type, val.length) + } +} diff --git a/crates/nano-arrow/src/array/growable/primitive.rs b/crates/nano-arrow/src/array/growable/primitive.rs new file mode 100644 index 000000000000..cade744a5936 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/primitive.rs @@ -0,0 +1,101 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::Growable; +use crate::array::{Array, PrimitiveArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::types::NativeType; + +/// Concrete [`Growable`] for the [`PrimitiveArray`]. +pub struct GrowablePrimitive<'a, T: NativeType> { + data_type: DataType, + arrays: Vec<&'a [T]>, + validity: MutableBitmap, + values: Vec, + extend_null_bits: Vec>, +} + +impl<'a, T: NativeType> GrowablePrimitive<'a, T> { + /// Creates a new [`GrowablePrimitive`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new( + arrays: Vec<&'a PrimitiveArray>, + mut use_validity: bool, + capacity: usize, + ) -> Self { + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if !use_validity & arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let data_type = arrays[0].data_type().clone(); + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let arrays = arrays + .iter() + .map(|array| array.values().as_slice()) + .collect::>(); + + Self { + data_type, + arrays, + values: Vec::with_capacity(capacity), + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + #[inline] + fn to(&mut self) -> PrimitiveArray { + let validity = std::mem::take(&mut self.validity); + let values = std::mem::take(&mut self.values); + + PrimitiveArray::::new(self.data_type.clone(), values.into(), validity.into()) + } +} + +impl<'a, T: NativeType> Growable<'a> for GrowablePrimitive<'a, T> { + #[inline] + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let values = self.arrays[index]; + self.values.extend_from_slice(&values[start..start + len]); + } + + #[inline] + fn extend_validity(&mut self, additional: usize) { + self.values + .resize(self.values.len() + additional, T::default()); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.values.len() + } + + #[inline] + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + #[inline] + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a, T: NativeType> From> for PrimitiveArray { + #[inline] + fn from(val: GrowablePrimitive<'a, T>) -> Self { + PrimitiveArray::::new(val.data_type, val.values.into(), val.validity.into()) + } +} diff --git a/crates/nano-arrow/src/array/growable/structure.rs b/crates/nano-arrow/src/array/growable/structure.rs new file mode 100644 index 000000000000..10afd20e7f06 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/structure.rs @@ -0,0 +1,132 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, ExtendNullBits}; +use super::{make_growable, Growable}; +use crate::array::{Array, StructArray}; +use crate::bitmap::MutableBitmap; + +/// Concrete [`Growable`] for the [`StructArray`]. +pub struct GrowableStruct<'a> { + arrays: Vec<&'a StructArray>, + validity: MutableBitmap, + values: Vec + 'a>>, + extend_null_bits: Vec>, +} + +impl<'a> GrowableStruct<'a> { + /// Creates a new [`GrowableStruct`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. + pub fn new(arrays: Vec<&'a StructArray>, mut use_validity: bool, capacity: usize) -> Self { + assert!(!arrays.is_empty()); + + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. 
+ if arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + let arrays = arrays + .iter() + .map(|array| array.as_any().downcast_ref::().unwrap()) + .collect::>(); + + // ([field1, field2], [field3, field4]) -> ([field1, field3], [field2, field3]) + let values = (0..arrays[0].values().len()) + .map(|i| { + make_growable( + &arrays + .iter() + .map(|x| x.values()[i].as_ref()) + .collect::>(), + use_validity, + capacity, + ) + }) + .collect::>>(); + + Self { + arrays, + values, + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> StructArray { + let validity = std::mem::take(&mut self.validity); + let values = std::mem::take(&mut self.values); + let values = values.into_iter().map(|mut x| x.as_box()).collect(); + + StructArray::new(self.arrays[0].data_type().clone(), values, validity.into()) + } +} + +impl<'a> Growable<'a> for GrowableStruct<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let array = self.arrays[index]; + if array.null_count() == 0 { + self.values + .iter_mut() + .for_each(|child| child.extend(index, start, len)) + } else { + (start..start + len).for_each(|i| { + if array.is_valid(i) { + self.values + .iter_mut() + .for_each(|child| child.extend(index, i, 1)) + } else { + self.values + .iter_mut() + .for_each(|child| child.extend_validity(1)) + } + }) + } + } + + fn extend_validity(&mut self, additional: usize) { + self.values + .iter_mut() + .for_each(|child| child.extend_validity(additional)); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + // All children should have the same indexing, so just use the first + // one. If we don't have children, we might still have a validity + // array, so use that. + if let Some(child) = self.values.get(0) { + child.len() + } else { + self.validity.len() + } + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a> From> for StructArray { + fn from(val: GrowableStruct<'a>) -> Self { + let values = val.values.into_iter().map(|mut x| x.as_box()).collect(); + + StructArray::new( + val.arrays[0].data_type().clone(), + values, + val.validity.into(), + ) + } +} diff --git a/crates/nano-arrow/src/array/growable/union.rs b/crates/nano-arrow/src/array/growable/union.rs new file mode 100644 index 000000000000..4ef39f16fbb3 --- /dev/null +++ b/crates/nano-arrow/src/array/growable/union.rs @@ -0,0 +1,120 @@ +use std::sync::Arc; + +use super::{make_growable, Growable}; +use crate::array::{Array, UnionArray}; + +/// Concrete [`Growable`] for the [`UnionArray`]. +pub struct GrowableUnion<'a> { + arrays: Vec<&'a UnionArray>, + types: Vec, + offsets: Option>, + fields: Vec + 'a>>, +} + +impl<'a> GrowableUnion<'a> { + /// Creates a new [`GrowableUnion`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// Panics iff + /// * `arrays` is empty. 
+ /// * any of the arrays has a different + pub fn new(arrays: Vec<&'a UnionArray>, capacity: usize) -> Self { + let first = arrays[0].data_type(); + assert!(arrays.iter().all(|x| x.data_type() == first)); + + let has_offsets = arrays[0].offsets().is_some(); + + let fields = (0..arrays[0].fields().len()) + .map(|i| { + make_growable( + &arrays + .iter() + .map(|x| x.fields()[i].as_ref()) + .collect::>(), + false, + capacity, + ) + }) + .collect::>>(); + + Self { + arrays, + fields, + offsets: if has_offsets { + Some(Vec::with_capacity(capacity)) + } else { + None + }, + types: Vec::with_capacity(capacity), + } + } + + fn to(&mut self) -> UnionArray { + let types = std::mem::take(&mut self.types); + let fields = std::mem::take(&mut self.fields); + let offsets = std::mem::take(&mut self.offsets); + let fields = fields.into_iter().map(|mut x| x.as_box()).collect(); + + UnionArray::new( + self.arrays[0].data_type().clone(), + types.into(), + fields, + offsets.map(|x| x.into()), + ) + } +} + +impl<'a> Growable<'a> for GrowableUnion<'a> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + let array = self.arrays[index]; + + let types = &array.types()[start..start + len]; + self.types.extend(types); + if let Some(x) = self.offsets.as_mut() { + let offsets = &array.offsets().unwrap()[start..start + len]; + + // in a dense union, each slot has its own offset. We extend the fields accordingly. + for (&type_, &offset) in types.iter().zip(offsets.iter()) { + let field = &mut self.fields[type_ as usize]; + // The offset for the element that is about to be extended is the current length + // of the child field of the corresponding type. Note that this may be very + // different than the original offset from the array we are extending from as + // it is a function of the previous extensions to this child. + x.push(field.len() as i32); + field.extend(index, offset as usize, 1); + } + } else { + // in a sparse union, every field has the same length => extend all fields equally + self.fields + .iter_mut() + .for_each(|field| field.extend(index, start, len)) + } + } + + fn extend_validity(&mut self, _additional: usize) {} + + #[inline] + fn len(&self) -> usize { + self.types.len() + } + + fn as_arc(&mut self) -> Arc { + self.to().arced() + } + + fn as_box(&mut self) -> Box { + self.to().boxed() + } +} + +impl<'a> From> for UnionArray { + fn from(val: GrowableUnion<'a>) -> Self { + let fields = val.fields.into_iter().map(|mut x| x.as_box()).collect(); + + UnionArray::new( + val.arrays[0].data_type().clone(), + val.types.into(), + fields, + val.offsets.map(|x| x.into()), + ) + } +} diff --git a/crates/nano-arrow/src/array/growable/utf8.rs b/crates/nano-arrow/src/array/growable/utf8.rs new file mode 100644 index 000000000000..1ea01ffd040a --- /dev/null +++ b/crates/nano-arrow/src/array/growable/utf8.rs @@ -0,0 +1,104 @@ +use std::sync::Arc; + +use super::utils::{build_extend_null_bits, extend_offset_values, ExtendNullBits}; +use super::Growable; +use crate::array::{Array, Utf8Array}; +use crate::bitmap::MutableBitmap; +use crate::offset::{Offset, Offsets}; + +/// Concrete [`Growable`] for the [`Utf8Array`]. +pub struct GrowableUtf8<'a, O: Offset> { + arrays: Vec<&'a Utf8Array>, + validity: MutableBitmap, + values: Vec, + offsets: Offsets, + extend_null_bits: Vec>, +} + +impl<'a, O: Offset> GrowableUtf8<'a, O> { + /// Creates a new [`GrowableUtf8`] bound to `arrays` with a pre-allocated `capacity`. + /// # Panics + /// If `arrays` is empty. 
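// A sketch of using `GrowableUtf8` defined above directly, assuming `Utf8Array`
// keeps its arrow2-style `from` constructor over options; when the concrete
// array type is known, this can be used instead of going through `make_growable`.

use nano_arrow::array::growable::{Growable, GrowableUtf8};
use nano_arrow::array::Utf8Array;

fn concat_utf8() -> Utf8Array<i32> {
    let a = Utf8Array::<i32>::from([Some("foo"), None, Some("bar")]);
    let b = Utf8Array::<i32>::from([Some("baz")]);

    // `use_validity` is promoted internally because `a` contains a null.
    let mut growable = GrowableUtf8::new(vec![&a, &b], false, 4);
    growable.extend(0, 0, 3); // all of `a`
    growable.extend(1, 0, 1); // all of `b`
    growable.into()           // ["foo", None, "bar", "baz"]
}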
+ pub fn new(arrays: Vec<&'a Utf8Array>, mut use_validity: bool, capacity: usize) -> Self { + // if any of the arrays has nulls, insertions from any array requires setting bits + // as there is at least one array with nulls. + if arrays.iter().any(|array| array.null_count() > 0) { + use_validity = true; + }; + + let extend_null_bits = arrays + .iter() + .map(|array| build_extend_null_bits(*array, use_validity)) + .collect(); + + Self { + arrays: arrays.to_vec(), + values: Vec::with_capacity(0), + offsets: Offsets::with_capacity(capacity), + validity: MutableBitmap::with_capacity(capacity), + extend_null_bits, + } + } + + fn to(&mut self) -> Utf8Array { + let validity = std::mem::take(&mut self.validity); + let offsets = std::mem::take(&mut self.offsets); + let values = std::mem::take(&mut self.values); + + #[cfg(debug_assertions)] + { + crate::array::specification::try_check_utf8(&offsets, &values).unwrap(); + } + + unsafe { + Utf8Array::::try_new_unchecked( + self.arrays[0].data_type().clone(), + offsets.into(), + values.into(), + validity.into(), + ) + .unwrap() + } + } +} + +impl<'a, O: Offset> Growable<'a> for GrowableUtf8<'a, O> { + fn extend(&mut self, index: usize, start: usize, len: usize) { + (self.extend_null_bits[index])(&mut self.validity, start, len); + + let array = self.arrays[index]; + let offsets = array.offsets(); + let values = array.values(); + + self.offsets + .try_extend_from_slice(offsets, start, len) + .unwrap(); + + // values + extend_offset_values::(&mut self.values, offsets.as_slice(), values, start, len); + } + + fn extend_validity(&mut self, additional: usize) { + self.offsets.extend_constant(additional); + self.validity.extend_constant(additional, false); + } + + #[inline] + fn len(&self) -> usize { + self.offsets.len() - 1 + } + + fn as_arc(&mut self) -> Arc { + Arc::new(self.to()) + } + + fn as_box(&mut self) -> Box { + Box::new(self.to()) + } +} + +impl<'a, O: Offset> From> for Utf8Array { + fn from(mut val: GrowableUtf8<'a, O>) -> Self { + val.to() + } +} diff --git a/crates/nano-arrow/src/array/growable/utils.rs b/crates/nano-arrow/src/array/growable/utils.rs new file mode 100644 index 000000000000..ecdfb522249f --- /dev/null +++ b/crates/nano-arrow/src/array/growable/utils.rs @@ -0,0 +1,40 @@ +use crate::array::Array; +use crate::bitmap::MutableBitmap; +use crate::offset::Offset; + +// function used to extend nulls from arrays. This function's lifetime is bound to the array +// because it reads nulls from it. 
+pub(super) type ExtendNullBits<'a> = Box; + +pub(super) fn build_extend_null_bits(array: &dyn Array, use_validity: bool) -> ExtendNullBits { + if let Some(bitmap) = array.validity() { + Box::new(move |validity, start, len| { + debug_assert!(start + len <= bitmap.len()); + let (slice, offset, _) = bitmap.as_slice(); + // safety: invariant offset + length <= slice.len() + unsafe { + validity.extend_from_slice_unchecked(slice, start + offset, len); + } + }) + } else if use_validity { + Box::new(|validity, _, len| { + validity.extend_constant(len, true); + }) + } else { + Box::new(|_, _, _| {}) + } +} + +#[inline] +pub(super) fn extend_offset_values( + buffer: &mut Vec, + offsets: &[O], + values: &[u8], + start: usize, + len: usize, +) { + let start_values = offsets[start].to_usize(); + let end_values = offsets[start + len].to_usize(); + let new_values = &values[start_values..end_values]; + buffer.extend_from_slice(new_values); +} diff --git a/crates/nano-arrow/src/array/indexable.rs b/crates/nano-arrow/src/array/indexable.rs new file mode 100644 index 000000000000..d3f466722aa6 --- /dev/null +++ b/crates/nano-arrow/src/array/indexable.rs @@ -0,0 +1,194 @@ +use std::borrow::Borrow; + +use crate::array::{ + MutableArray, MutableBinaryArray, MutableBinaryValuesArray, MutableBooleanArray, + MutableFixedSizeBinaryArray, MutablePrimitiveArray, MutableUtf8Array, MutableUtf8ValuesArray, +}; +use crate::offset::Offset; +use crate::types::NativeType; + +/// Trait for arrays that can be indexed directly to extract a value. +pub trait Indexable { + /// The type of the element at index `i`; may be a reference type or a value type. + type Value<'a>: Borrow + where + Self: 'a; + + type Type: ?Sized; + + /// Returns the element at index `i`. + /// # Panic + /// May panic if `i >= self.len()`. + fn value_at(&self, index: usize) -> Self::Value<'_>; + + /// Returns the element at index `i`. + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + unsafe fn value_unchecked_at(&self, index: usize) -> Self::Value<'_> { + self.value_at(index) + } +} + +pub trait AsIndexed { + fn as_indexed(&self) -> &M::Type; +} + +impl Indexable for MutableBooleanArray { + type Value<'a> = bool; + type Type = bool; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + self.values().get(i) + } +} + +impl AsIndexed for bool { + #[inline] + fn as_indexed(&self) -> &bool { + self + } +} + +impl Indexable for MutableBinaryArray { + type Value<'a> = &'a [u8]; + type Type = [u8]; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + // TODO: add .value() / .value_unchecked() to MutableBinaryArray? + assert!(i < self.len()); + unsafe { self.value_unchecked_at(i) } + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + // TODO: add .value() / .value_unchecked() to MutableBinaryArray? 
+ // soundness: the invariant of the function + let (start, end) = self.offsets().start_end_unchecked(i); + // soundness: the invariant of the struct + self.values().get_unchecked(start..end) + } +} + +impl AsIndexed> for &[u8] { + #[inline] + fn as_indexed(&self) -> &[u8] { + self + } +} + +impl Indexable for MutableBinaryValuesArray { + type Value<'a> = &'a [u8]; + type Type = [u8]; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + self.value(i) + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + self.value_unchecked(i) + } +} + +impl AsIndexed> for &[u8] { + #[inline] + fn as_indexed(&self) -> &[u8] { + self + } +} + +impl Indexable for MutableFixedSizeBinaryArray { + type Value<'a> = &'a [u8]; + type Type = [u8]; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + self.value(i) + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + // soundness: the invariant of the struct + self.value_unchecked(i) + } +} + +impl AsIndexed for &[u8] { + #[inline] + fn as_indexed(&self) -> &[u8] { + self + } +} + +// TODO: should NativeType derive from Hash? +impl Indexable for MutablePrimitiveArray { + type Value<'a> = T; + type Type = T; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + assert!(i < self.len()); + // TODO: add Length trait? (for both Array and MutableArray) + unsafe { self.value_unchecked_at(i) } + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + *self.values().get_unchecked(i) + } +} + +impl AsIndexed> for T { + #[inline] + fn as_indexed(&self) -> &T { + self + } +} + +impl Indexable for MutableUtf8Array { + type Value<'a> = &'a str; + type Type = str; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + self.value(i) + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + self.value_unchecked(i) + } +} + +impl> AsIndexed> for V { + #[inline] + fn as_indexed(&self) -> &str { + self.as_ref() + } +} + +impl Indexable for MutableUtf8ValuesArray { + type Value<'a> = &'a str; + type Type = str; + + #[inline] + fn value_at(&self, i: usize) -> Self::Value<'_> { + self.value(i) + } + + #[inline] + unsafe fn value_unchecked_at(&self, i: usize) -> Self::Value<'_> { + self.value_unchecked(i) + } +} + +impl> AsIndexed> for V { + #[inline] + fn as_indexed(&self) -> &str { + self.as_ref() + } +} diff --git a/crates/nano-arrow/src/array/iterator.rs b/crates/nano-arrow/src/array/iterator.rs new file mode 100644 index 000000000000..5e8ed44d861e --- /dev/null +++ b/crates/nano-arrow/src/array/iterator.rs @@ -0,0 +1,83 @@ +use crate::trusted_len::TrustedLen; + +mod private { + pub trait Sealed {} + + impl<'a, T: super::ArrayAccessor<'a>> Sealed for T {} +} + +/// Sealed trait representing assess to a value of an array. +/// # Safety +/// Implementers of this trait guarantee that +/// `value_unchecked` is safe when called up to `len` +pub unsafe trait ArrayAccessor<'a>: private::Sealed { + type Item: 'a; + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item; + fn len(&self) -> usize; +} + +/// Iterator of values of an [`ArrayAccessor`]. 
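// The iterator defined below is what concrete arrays wrap in their
// `values_iter()` methods; `iter()` then pairs it with the validity bitmap via
// `ZipValidity`. A usage sketch with arrow2-style constructors assumed:

use nano_arrow::array::Utf8Array;

fn iterate() {
    let array = Utf8Array::<i32>::from([Some("a"), None, Some("c")]);

    // values_iter ignores validity and yields the raw slots: "a", "", "c"
    let raw: Vec<&str> = array.values_iter().collect();

    // iter zips the values with the validity bitmap: Some("a"), None, Some("c")
    let checked: Vec<Option<&str>> = array.iter().collect();

    assert_eq!(raw.len(), checked.len());
}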
+#[derive(Debug, Clone)] +pub struct ArrayValuesIter<'a, A: ArrayAccessor<'a>> { + array: &'a A, + index: usize, + end: usize, +} + +impl<'a, A: ArrayAccessor<'a>> ArrayValuesIter<'a, A> { + /// Creates a new [`ArrayValuesIter`] + #[inline] + pub fn new(array: &'a A) -> Self { + Self { + array, + index: 0, + end: array.len(), + } + } +} + +impl<'a, A: ArrayAccessor<'a>> Iterator for ArrayValuesIter<'a, A> { + type Item = A::Item; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + Some(unsafe { self.array.value_unchecked(old) }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + let new_index = self.index + n; + if new_index > self.end { + self.index = self.end; + None + } else { + self.index = new_index; + self.next() + } + } +} + +impl<'a, A: ArrayAccessor<'a>> DoubleEndedIterator for ArrayValuesIter<'a, A> { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + Some(unsafe { self.array.value_unchecked(self.end) }) + } + } +} + +unsafe impl<'a, A: ArrayAccessor<'a>> TrustedLen for ArrayValuesIter<'a, A> {} +impl<'a, A: ArrayAccessor<'a>> ExactSizeIterator for ArrayValuesIter<'a, A> {} diff --git a/crates/nano-arrow/src/array/list/data.rs b/crates/nano-arrow/src/array/list/data.rs new file mode 100644 index 000000000000..6f3424c96ce6 --- /dev/null +++ b/crates/nano-arrow/src/array/list/data.rs @@ -0,0 +1,38 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{from_data, to_data, Arrow2Arrow, ListArray}; +use crate::bitmap::Bitmap; +use crate::offset::{Offset, OffsetsBuffer}; + +impl Arrow2Arrow for ListArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .buffers(vec![self.offsets.clone().into_inner().into()]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())) + .child_data(vec![to_data(self.values.as_ref())]); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + if data.is_empty() { + // Handle empty offsets + return Self::new_empty(data_type); + } + + let mut offsets = unsafe { OffsetsBuffer::new_unchecked(data.buffers()[0].clone().into()) }; + offsets.slice(data.offset(), data.len() + 1); + + Self { + data_type, + offsets, + values: from_data(&data.child_data()[0]), + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/list/ffi.rs b/crates/nano-arrow/src/array/list/ffi.rs new file mode 100644 index 000000000000..487b4ad40128 --- /dev/null +++ b/crates/nano-arrow/src/array/list/ffi.rs @@ -0,0 +1,68 @@ +use super::super::ffi::ToFfi; +use super::super::Array; +use super::ListArray; +use crate::array::FromFfi; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; +use crate::offset::{Offset, OffsetsBuffer}; + +unsafe impl ToFfi for ListArray { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.offsets.buffer().as_ptr().cast::()), + ] + } + + fn children(&self) -> Vec> { + vec![self.values.clone()] + } + + fn offset(&self) -> Option { + let offset = self.offsets.buffer().offset(); + if let Some(bitmap) = self.validity.as_ref() { + if 
bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.offsets.buffer().offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + offsets: self.offsets.clone(), + values: self.values.clone(), + } + } +} + +impl FromFfi for ListArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let offsets = unsafe { array.buffer::(1) }?; + let child = unsafe { array.child(0)? }; + let values = ffi::try_from(child)?; + + // assumption that data from FFI is well constructed + let offsets = unsafe { OffsetsBuffer::new_unchecked(offsets) }; + + Ok(Self::new(data_type, offsets, values, validity)) + } +} diff --git a/crates/nano-arrow/src/array/list/fmt.rs b/crates/nano-arrow/src/array/list/fmt.rs new file mode 100644 index 000000000000..67dcd6b78786 --- /dev/null +++ b/crates/nano-arrow/src/array/list/fmt.rs @@ -0,0 +1,30 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_vec}; +use super::ListArray; +use crate::offset::Offset; + +pub fn write_value( + array: &ListArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let values = array.value(index); + let writer = |f: &mut W, index| get_display(values.as_ref(), null)(f, index); + write_vec(f, writer, None, values.len(), null, false) +} + +impl Debug for ListArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + let head = if O::IS_LARGE { + "LargeListArray" + } else { + "ListArray" + }; + write!(f, "{head}")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/list/iterator.rs b/crates/nano-arrow/src/array/list/iterator.rs new file mode 100644 index 000000000000..28552bf4bb65 --- /dev/null +++ b/crates/nano-arrow/src/array/list/iterator.rs @@ -0,0 +1,68 @@ +use super::ListArray; +use crate::array::{Array, ArrayAccessor, ArrayValuesIter}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::offset::Offset; + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for ListArray { + type Item = Box; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +/// Iterator of values of a [`ListArray`]. 
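// Each slot of a ListArray materializes as a boxed sub-array, so the zipped
// iterator below yields `Option<Box<dyn Array>>`. A small sketch over an
// existing list array, with crate paths assumed:

use nano_arrow::array::{Array, ListArray};

fn total_inner_len(list: &ListArray<i32>) -> usize {
    list.iter()
        .map(|slot| slot.map(|values| values.len()).unwrap_or(0))
        .sum()
}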
+pub type ListValuesIter<'a, O> = ArrayValuesIter<'a, ListArray>; + +type ZipIter<'a, O> = ZipValidity, ListValuesIter<'a, O>, BitmapIter<'a>>; + +impl<'a, O: Offset> IntoIterator for &'a ListArray { + type Item = Option>; + type IntoIter = ZipIter<'a, O>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a, O: Offset> ListArray { + /// Returns an iterator of `Option>` + pub fn iter(&'a self) -> ZipIter<'a, O> { + ZipValidity::new_with_validity(ListValuesIter::new(self), self.validity.as_ref()) + } + + /// Returns an iterator of `Box` + pub fn values_iter(&'a self) -> ListValuesIter<'a, O> { + ListValuesIter::new(self) + } +} + +struct Iter>> { + current: i32, + offsets: std::vec::IntoIter, + values: I, +} + +impl> + Clone> Iterator for Iter { + type Item = Option>>; + + fn next(&mut self) -> Option { + let next = self.offsets.next(); + next.map(|next| { + let length = next - self.current; + let iter = self + .values + .clone() + .skip(self.current as usize) + .take(length as usize); + self.current = next; + Some(iter) + }) + } +} diff --git a/crates/nano-arrow/src/array/list/mod.rs b/crates/nano-arrow/src/array/list/mod.rs new file mode 100644 index 000000000000..dff4584d0cbf --- /dev/null +++ b/crates/nano-arrow/src/array/list/mod.rs @@ -0,0 +1,240 @@ +use super::specification::try_check_offsets_bounds; +use super::{new_empty_array, Array}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; +use crate::offset::{Offset, Offsets, OffsetsBuffer}; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +pub use iterator::*; +mod mutable; +pub use mutable::*; + +/// An [`Array`] semantically equivalent to `Vec>>>` with Arrow's in-memory. +#[derive(Clone)] +pub struct ListArray { + data_type: DataType, + offsets: OffsetsBuffer, + values: Box, + validity: Option, +} + +impl ListArray { + /// Creates a new [`ListArray`]. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either [`crate::datatypes::PhysicalType::List`] or [`crate::datatypes::PhysicalType::LargeList`]. + /// * The `data_type`'s inner field's data type is not equal to `values.data_type`. + /// # Implementation + /// This function is `O(1)` + pub fn try_new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Box, + validity: Option, + ) -> Result { + try_check_offsets_bounds(&offsets, values.len())?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != offsets.len_proxy()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + let child_data_type = Self::try_get_child(&data_type)?.data_type(); + let values_data_type = values.data_type(); + if child_data_type != values_data_type { + return Err(Error::oos( + format!("ListArray's child's DataType must match. However, the expected DataType is {child_data_type:?} while it got {values_data_type:?}."), + )); + } + + Ok(Self { + data_type, + offsets, + values, + validity, + }) + } + + /// Creates a new [`ListArray`]. + /// + /// # Panics + /// This function panics iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. 
+ /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either [`crate::datatypes::PhysicalType::List`] or [`crate::datatypes::PhysicalType::LargeList`]. + /// * The `data_type`'s inner field's data type is not equal to `values.data_type`. + /// # Implementation + /// This function is `O(1)` + pub fn new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Box, + validity: Option, + ) -> Self { + Self::try_new(data_type, offsets, values, validity).unwrap() + } + + /// Returns a new empty [`ListArray`]. + pub fn new_empty(data_type: DataType) -> Self { + let values = new_empty_array(Self::get_child_type(&data_type).clone()); + Self::new(data_type, OffsetsBuffer::default(), values, None) + } + + /// Returns a new null [`ListArray`]. + #[inline] + pub fn new_null(data_type: DataType, length: usize) -> Self { + let child = Self::get_child_type(&data_type).clone(); + Self::new( + data_type, + Offsets::new_zeroed(length).into(), + new_empty_array(child), + Some(Bitmap::new_zeroed(length)), + ) + } +} + +impl ListArray { + /// Slices this [`ListArray`]. + /// # Panics + /// panics iff `offset + length >= self.len()` + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`ListArray`]. + /// # Safety + /// The caller must ensure that `offset + length < self.len()`. + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.offsets.slice_unchecked(offset, length + 1); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); +} + +// Accessors +impl ListArray { + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// Returns the element at index `i` + /// # Panic + /// Panics iff `i >= self.len()` + #[inline] + pub fn value(&self, i: usize) -> Box { + assert!(i < self.len()); + // Safety: invariant of this function + unsafe { self.value_unchecked(i) } + } + + /// Returns the element at index `i` as &str + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> Box { + // safety: the invariant of the function + let (start, end) = self.offsets.start_end_unchecked(i); + let length = end - start; + + // safety: the invariant of the struct + self.values.sliced_unchecked(start, length) + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// The offsets [`Buffer`]. + #[inline] + pub fn offsets(&self) -> &OffsetsBuffer { + &self.offsets + } + + /// The values. + #[inline] + pub fn values(&self) -> &Box { + &self.values + } +} + +impl ListArray { + /// Returns a default [`DataType`]: inner field is named "item" and is nullable + pub fn default_datatype(data_type: DataType) -> DataType { + let field = Box::new(Field::new("item", data_type, true)); + if O::IS_LARGE { + DataType::LargeList(field) + } else { + DataType::List(field) + } + } + + /// Returns a the inner [`Field`] + /// # Panics + /// Panics iff the logical type is not consistent with this struct. 
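+    ///
+    /// Illustrative sketch (the `nano_arrow` path is assumed):
+    ///
+    /// ```ignore
+    /// use nano_arrow::array::ListArray;
+    /// use nano_arrow::datatypes::DataType;
+    ///
+    /// // `default_datatype` nests the inner type in a nullable field named "item".
+    /// let dt = ListArray::<i32>::default_datatype(DataType::Int32);
+    /// let child = ListArray::<i32>::get_child_field(&dt);
+    /// assert_eq!(child.name, "item");
+    /// assert_eq!(child.data_type, DataType::Int32);
+    /// ```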
+ pub fn get_child_field(data_type: &DataType) -> &Field { + Self::try_get_child(data_type).unwrap() + } + + /// Returns a the inner [`Field`] + /// # Errors + /// Panics iff the logical type is not consistent with this struct. + pub fn try_get_child(data_type: &DataType) -> Result<&Field, Error> { + if O::IS_LARGE { + match data_type.to_logical_type() { + DataType::LargeList(child) => Ok(child.as_ref()), + _ => Err(Error::oos("ListArray expects DataType::LargeList")), + } + } else { + match data_type.to_logical_type() { + DataType::List(child) => Ok(child.as_ref()), + _ => Err(Error::oos("ListArray expects DataType::List")), + } + } + } + + /// Returns a the inner [`DataType`] + /// # Panics + /// Panics iff the logical type is not consistent with this struct. + pub fn get_child_type(data_type: &DataType) -> &DataType { + Self::get_child_field(data_type).data_type() + } +} + +impl Array for ListArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/list/mutable.rs b/crates/nano-arrow/src/array/list/mutable.rs new file mode 100644 index 000000000000..39dc22da3cb0 --- /dev/null +++ b/crates/nano-arrow/src/array/list/mutable.rs @@ -0,0 +1,315 @@ +use std::sync::Arc; + +use super::ListArray; +use crate::array::physical_binary::extend_validity; +use crate::array::{Array, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; +use crate::trusted_len::TrustedLen; + +/// The mutable version of [`ListArray`]. +#[derive(Debug, Clone)] +pub struct MutableListArray { + data_type: DataType, + offsets: Offsets, + values: M, + validity: Option, +} + +impl MutableListArray { + /// Creates a new empty [`MutableListArray`]. + pub fn new() -> Self { + let values = M::default(); + let data_type = ListArray::::default_datatype(values.data_type().clone()); + Self::new_from(values, data_type, 0) + } + + /// Creates a new [`MutableListArray`] with a capacity. 
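+    ///
+    /// Illustrative sketch (the `nano_arrow` path is assumed):
+    ///
+    /// ```ignore
+    /// use nano_arrow::array::{MutableListArray, MutablePrimitiveArray};
+    ///
+    /// // Pre-allocates room for 8 offsets; the child values start empty.
+    /// let list = MutableListArray::<i32, MutablePrimitiveArray<i32>>::with_capacity(8);
+    /// assert_eq!(list.len(), 0);
+    /// ```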
+ pub fn with_capacity(capacity: usize) -> Self { + let values = M::default(); + let data_type = ListArray::::default_datatype(values.data_type().clone()); + + let offsets = Offsets::::with_capacity(capacity); + Self { + data_type, + offsets, + values, + validity: None, + } + } +} + +impl Default for MutableListArray { + fn default() -> Self { + Self::new() + } +} + +impl From> for ListArray { + fn from(mut other: MutableListArray) -> Self { + ListArray::new( + other.data_type, + other.offsets.into(), + other.values.as_box(), + other.validity.map(|x| x.into()), + ) + } +} + +impl TryExtend> for MutableListArray +where + O: Offset, + M: MutableArray + TryExtend>, + I: IntoIterator>, +{ + fn try_extend>>(&mut self, iter: II) -> Result<()> { + let iter = iter.into_iter(); + self.reserve(iter.size_hint().0); + for items in iter { + self.try_push(items)?; + } + Ok(()) + } +} + +impl TryPush> for MutableListArray +where + O: Offset, + M: MutableArray + TryExtend>, + I: IntoIterator>, +{ + #[inline] + fn try_push(&mut self, item: Option) -> Result<()> { + if let Some(items) = item { + let values = self.mut_values(); + values.try_extend(items)?; + self.try_push_valid()?; + } else { + self.push_null(); + } + Ok(()) + } +} + +impl TryExtendFromSelf for MutableListArray +where + O: Offset, + M: MutableArray + TryExtendFromSelf, +{ + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + self.values.try_extend_from_self(&other.values)?; + self.offsets.try_extend_from_self(&other.offsets) + } +} + +impl MutableListArray { + /// Creates a new [`MutableListArray`] from a [`MutableArray`] and capacity. + pub fn new_from(values: M, data_type: DataType, capacity: usize) -> Self { + let offsets = Offsets::::with_capacity(capacity); + assert_eq!(values.len(), 0); + ListArray::::get_child_field(&data_type); + Self { + data_type, + offsets, + values, + validity: None, + } + } + + /// Creates a new [`MutableListArray`] from a [`MutableArray`]. + pub fn new_with_field(values: M, name: &str, nullable: bool) -> Self { + let field = Box::new(Field::new(name, values.data_type().clone(), nullable)); + let data_type = if O::IS_LARGE { + DataType::LargeList(field) + } else { + DataType::List(field) + }; + Self::new_from(values, data_type, 0) + } + + /// Creates a new [`MutableListArray`] from a [`MutableArray`] and capacity. + pub fn new_with_capacity(values: M, capacity: usize) -> Self { + let data_type = ListArray::::default_datatype(values.data_type().clone()); + Self::new_from(values, data_type, capacity) + } + + /// Creates a new [`MutableListArray`] from a [`MutableArray`], [`Offsets`] and + /// [`MutableBitmap`]. + pub fn new_from_mutable( + values: M, + offsets: Offsets, + validity: Option, + ) -> Self { + assert_eq!(values.len(), offsets.last().to_usize()); + let data_type = ListArray::::default_datatype(values.data_type().clone()); + Self { + data_type, + offsets, + values, + validity, + } + } + + #[inline] + /// Needs to be called when a valid value was extended to this array. + /// This is a relatively low level function, prefer `try_push` when you can. 
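+    ///
+    /// A sketch of the low-level pattern this supports: write into the child
+    /// values directly, then close the slot (the `nano_arrow` path is assumed):
+    ///
+    /// ```ignore
+    /// use nano_arrow::array::{MutableListArray, MutablePrimitiveArray};
+    ///
+    /// let mut list = MutableListArray::<i32, MutablePrimitiveArray<i32>>::new();
+    /// list.mut_values().push(Some(1));
+    /// list.mut_values().push(Some(2));
+    /// // Marks everything written since the last offset as one valid list: [1, 2].
+    /// list.try_push_valid().unwrap();
+    /// assert_eq!(list.len(), 1);
+    /// ```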
+ pub fn try_push_valid(&mut self) -> Result<()> { + let total_length = self.values.len(); + let offset = self.offsets.last().to_usize(); + let length = total_length.checked_sub(offset).ok_or(Error::Overflow)?; + + self.offsets.try_push_usize(length)?; + if let Some(validity) = &mut self.validity { + validity.push(true) + } + Ok(()) + } + + #[inline] + fn push_null(&mut self) { + self.offsets.extend_constant(1); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + } + + /// Expand this array, using elements from the underlying backing array. + /// Assumes the expansion begins at the highest previous offset, or zero if + /// this [`MutableListArray`] is currently empty. + /// + /// Panics if: + /// - the new offsets are not in monotonic increasing order. + /// - any new offset is not in bounds of the backing array. + /// - the passed iterator has no upper bound. + pub fn try_extend_from_lengths(&mut self, iterator: II) -> Result<()> + where + II: TrustedLen> + Clone, + { + self.offsets + .try_extend_from_lengths(iterator.clone().map(|x| x.unwrap_or_default()))?; + if let Some(validity) = &mut self.validity { + validity.extend_from_trusted_len_iter(iterator.map(|x| x.is_some())) + } + assert_eq!(self.offsets.last().to_usize(), self.values.len()); + Ok(()) + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// The values + pub fn mut_values(&mut self) -> &mut M { + &mut self.values + } + + /// The offsets + pub fn offsets(&self) -> &Offsets { + &self.offsets + } + + /// The values + pub fn values(&self) -> &M { + &self.values + } + + fn init_validity(&mut self) { + let len = self.offsets.len_proxy(); + + let mut validity = MutableBitmap::with_capacity(self.offsets.capacity()); + validity.extend_constant(len, true); + validity.set(len - 1, false); + self.validity = Some(validity) + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: ListArray = self.into(); + Arc::new(a) + } + + /// converts itself into [`Box`] + pub fn into_box(self) -> Box { + let a: ListArray = self.into(); + Box::new(a) + } + + /// Reserves `additional` slots. + pub fn reserve(&mut self, additional: usize) { + self.offsets.reserve(additional); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Shrinks the capacity of the [`MutableListArray`] to fit its current length. 
+ pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + self.offsets.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } +} + +impl MutableArray for MutableListArray { + fn len(&self) -> usize { + MutableListArray::len(self) + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + ListArray::new( + self.data_type.clone(), + std::mem::take(&mut self.offsets).into(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> Arc { + ListArray::new( + self.data_type.clone(), + std::mem::take(&mut self.offsets).into(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push_null() + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit(); + } +} diff --git a/crates/nano-arrow/src/array/map/data.rs b/crates/nano-arrow/src/array/map/data.rs new file mode 100644 index 000000000000..cb8862a4df3d --- /dev/null +++ b/crates/nano-arrow/src/array/map/data.rs @@ -0,0 +1,38 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{from_data, to_data, Arrow2Arrow, MapArray}; +use crate::bitmap::Bitmap; +use crate::offset::OffsetsBuffer; + +impl Arrow2Arrow for MapArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .buffers(vec![self.offsets.clone().into_inner().into()]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())) + .child_data(vec![to_data(self.field.as_ref())]); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + if data.is_empty() { + // Handle empty offsets + return Self::new_empty(data_type); + } + + let mut offsets = unsafe { OffsetsBuffer::new_unchecked(data.buffers()[0].clone().into()) }; + offsets.slice(data.offset(), data.len() + 1); + + Self { + data_type: data.data_type().clone().into(), + offsets, + field: from_data(&data.child_data()[0]), + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/map/ffi.rs b/crates/nano-arrow/src/array/map/ffi.rs new file mode 100644 index 000000000000..9193e7253753 --- /dev/null +++ b/crates/nano-arrow/src/array/map/ffi.rs @@ -0,0 +1,68 @@ +use super::super::ffi::ToFfi; +use super::super::Array; +use super::MapArray; +use crate::array::FromFfi; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; +use crate::offset::OffsetsBuffer; + +unsafe impl ToFfi for MapArray { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.offsets.buffer().as_ptr().cast::()), + ] + } + + fn children(&self) -> Vec> { + vec![self.field.clone()] + } + + fn offset(&self) -> Option { + let offset = self.offsets.buffer().offset(); + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = 
self.offsets.buffer().offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + offsets: self.offsets.clone(), + field: self.field.clone(), + } + } +} + +impl FromFfi for MapArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let offsets = unsafe { array.buffer::(1) }?; + let child = array.child(0)?; + let values = ffi::try_from(child)?; + + // assumption that data from FFI is well constructed + let offsets = unsafe { OffsetsBuffer::new_unchecked(offsets) }; + + Self::try_new(data_type, offsets, values, validity) + } +} diff --git a/crates/nano-arrow/src/array/map/fmt.rs b/crates/nano-arrow/src/array/map/fmt.rs new file mode 100644 index 000000000000..60abf56e18c5 --- /dev/null +++ b/crates/nano-arrow/src/array/map/fmt.rs @@ -0,0 +1,24 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_vec}; +use super::MapArray; + +pub fn write_value( + array: &MapArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let values = array.value(index); + let writer = |f: &mut W, index| get_display(values.as_ref(), null)(f, index); + write_vec(f, writer, None, values.len(), null, false) +} + +impl Debug for MapArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + write!(f, "MapArray")?; + write_vec(f, writer, self.validity.as_ref(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/map/iterator.rs b/crates/nano-arrow/src/array/map/iterator.rs new file mode 100644 index 000000000000..f424e91b8043 --- /dev/null +++ b/crates/nano-arrow/src/array/map/iterator.rs @@ -0,0 +1,81 @@ +use super::MapArray; +use crate::array::Array; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::trusted_len::TrustedLen; + +/// Iterator of values of an [`ListArray`]. 
+#[derive(Clone, Debug)] +pub struct MapValuesIter<'a> { + array: &'a MapArray, + index: usize, + end: usize, +} + +impl<'a> MapValuesIter<'a> { + #[inline] + pub fn new(array: &'a MapArray) -> Self { + Self { + array, + index: 0, + end: array.len(), + } + } +} + +impl<'a> Iterator for MapValuesIter<'a> { + type Item = Box; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + // Safety: + // self.end is maximized by the length of the array + Some(unsafe { self.array.value_unchecked(old) }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } +} + +unsafe impl<'a> TrustedLen for MapValuesIter<'a> {} + +impl<'a> DoubleEndedIterator for MapValuesIter<'a> { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + // Safety: + // self.end is maximized by the length of the array + Some(unsafe { self.array.value_unchecked(self.end) }) + } + } +} + +impl<'a> IntoIterator for &'a MapArray { + type Item = Option>; + type IntoIter = ZipValidity, MapValuesIter<'a>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> MapArray { + /// Returns an iterator of `Option>` + pub fn iter(&'a self) -> ZipValidity, MapValuesIter<'a>, BitmapIter<'a>> { + ZipValidity::new_with_validity(MapValuesIter::new(self), self.validity()) + } + + /// Returns an iterator of `Box` + pub fn values_iter(&'a self) -> MapValuesIter<'a> { + MapValuesIter::new(self) + } +} diff --git a/crates/nano-arrow/src/array/map/mod.rs b/crates/nano-arrow/src/array/map/mod.rs new file mode 100644 index 000000000000..fca2e3bf68c1 --- /dev/null +++ b/crates/nano-arrow/src/array/map/mod.rs @@ -0,0 +1,204 @@ +use super::specification::try_check_offsets_bounds; +use super::{new_empty_array, Array}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; +use crate::offset::OffsetsBuffer; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +pub use iterator::*; + +/// An array representing a (key, value), both of arbitrary logical types. +#[derive(Clone)] +pub struct MapArray { + data_type: DataType, + // invariant: field.len() == offsets.len() + offsets: OffsetsBuffer, + field: Box, + // invariant: offsets.len() - 1 == Bitmap::len() + validity: Option, +} + +impl MapArray { + /// Returns a new [`MapArray`]. + /// # Errors + /// This function errors iff: + /// * The last offset is not equal to the field' length + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Map`] + /// * The fields' `data_type` is not equal to the inner field of `data_type` + /// * The validity is not `None` and its length is different from `offsets.len() - 1`. 
+ pub fn try_new( + data_type: DataType, + offsets: OffsetsBuffer, + field: Box, + validity: Option, + ) -> Result { + try_check_offsets_bounds(&offsets, field.len())?; + + let inner_field = Self::try_get_field(&data_type)?; + if let DataType::Struct(inner) = inner_field.data_type() { + if inner.len() != 2 { + return Err(Error::InvalidArgumentError( + "MapArray's inner `Struct` must have 2 fields (keys and maps)".to_string(), + )); + } + } else { + return Err(Error::InvalidArgumentError( + "MapArray expects `DataType::Struct` as its inner logical type".to_string(), + )); + } + if field.data_type() != inner_field.data_type() { + return Err(Error::InvalidArgumentError( + "MapArray expects `field.data_type` to match its inner DataType".to_string(), + )); + } + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != offsets.len_proxy()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + Ok(Self { + data_type, + field, + offsets, + validity, + }) + } + + /// Creates a new [`MapArray`]. + /// # Panics + /// * The last offset is not equal to the field' length. + /// * The `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Map`], + /// * The validity is not `None` and its length is different from `offsets.len() - 1`. + pub fn new( + data_type: DataType, + offsets: OffsetsBuffer, + field: Box, + validity: Option, + ) -> Self { + Self::try_new(data_type, offsets, field, validity).unwrap() + } + + /// Returns a new null [`MapArray`] of `length`. + pub fn new_null(data_type: DataType, length: usize) -> Self { + let field = new_empty_array(Self::get_field(&data_type).data_type().clone()); + Self::new( + data_type, + vec![0i32; 1 + length].try_into().unwrap(), + field, + Some(Bitmap::new_zeroed(length)), + ) + } + + /// Returns a new empty [`MapArray`]. + pub fn new_empty(data_type: DataType) -> Self { + let field = new_empty_array(Self::get_field(&data_type).data_type().clone()); + Self::new(data_type, OffsetsBuffer::default(), field, None) + } +} + +impl MapArray { + /// Returns a slice of this [`MapArray`]. + /// # Panics + /// panics iff `offset + length >= self.len()` + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Returns a slice of this [`MapArray`]. + /// # Safety + /// The caller must ensure that `offset + length < self.len()`. 
+ #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.offsets.slice_unchecked(offset, length + 1); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); + + pub(crate) fn try_get_field(data_type: &DataType) -> Result<&Field, Error> { + if let DataType::Map(field, _) = data_type.to_logical_type() { + Ok(field.as_ref()) + } else { + Err(Error::oos( + "The data_type's logical type must be DataType::Map", + )) + } + } + + pub(crate) fn get_field(data_type: &DataType) -> &Field { + Self::try_get_field(data_type).unwrap() + } +} + +// Accessors +impl MapArray { + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// returns the offsets + #[inline] + pub fn offsets(&self) -> &OffsetsBuffer { + &self.offsets + } + + /// Returns the field (guaranteed to be a `Struct`) + #[inline] + pub fn field(&self) -> &Box { + &self.field + } + + /// Returns the element at index `i`. + #[inline] + pub fn value(&self, i: usize) -> Box { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the element at index `i`. + /// # Safety + /// Assumes that the `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> Box { + // soundness: the invariant of the function + let (start, end) = self.offsets.start_end_unchecked(i); + let length = end - start; + + // soundness: the invariant of the struct + self.field.sliced_unchecked(start, length) + } +} + +impl Array for MapArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/mod.rs b/crates/nano-arrow/src/array/mod.rs new file mode 100644 index 000000000000..0d8534fc9e71 --- /dev/null +++ b/crates/nano-arrow/src/array/mod.rs @@ -0,0 +1,787 @@ +//! Contains the [`Array`] and [`MutableArray`] trait objects declaring arrays, +//! as well as concrete arrays (such as [`Utf8Array`] and [`MutableUtf8Array`]). +//! +//! Fixed-length containers with optional values +//! that are laid in memory according to the Arrow specification. +//! Each array type has its own `struct`. The following are the main array types: +//! * [`PrimitiveArray`] and [`MutablePrimitiveArray`], an array of values with a fixed length such as integers, floats, etc. +//! * [`BooleanArray`] and [`MutableBooleanArray`], an array of boolean values (stored as a bitmap) +//! * [`Utf8Array`] and [`MutableUtf8Array`], an array of variable length utf8 values +//! * [`BinaryArray`] and [`MutableBinaryArray`], an array of opaque variable length values +//! * [`ListArray`] and [`MutableListArray`], an array of arrays (e.g. `[[1, 2], None, [], [None]]`) +//! * [`StructArray`] and [`MutableStructArray`], an array of arrays identified by a string (e.g. `{"a": [1, 2], "b": [true, false]}`) +//! All immutable arrays implement the trait object [`Array`] and that can be downcasted +//! to a concrete struct based on [`PhysicalType`](crate::datatypes::PhysicalType) available from [`Array::data_type`]. +//! All immutable arrays are backed by [`Buffer`](crate::buffer::Buffer) and thus cloning and slicing them is `O(1)`. +//! +//! 
Most arrays contain a [`MutableArray`] counterpart that is neither clonable nor sliceable, but +//! can be operated in-place. +use std::any::Any; +use std::sync::Arc; + +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::Result; + +pub mod physical_binary; + +/// A trait representing an immutable Arrow array. Arrow arrays are trait objects +/// that are infallibly downcasted to concrete types according to the [`Array::data_type`]. +pub trait Array: Send + Sync + dyn_clone::DynClone + 'static { + /// Converts itself to a reference of [`Any`], which enables downcasting to concrete types. + fn as_any(&self) -> &dyn Any; + + /// Converts itself to a mutable reference of [`Any`], which enables mutable downcasting to concrete types. + fn as_any_mut(&mut self) -> &mut dyn Any; + + /// The length of the [`Array`]. Every array has a length corresponding to the number of + /// elements (slots). + fn len(&self) -> usize; + + /// whether the array is empty + fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// The [`DataType`] of the [`Array`]. In combination with [`Array::as_any`], this can be + /// used to downcast trait objects (`dyn Array`) to concrete arrays. + fn data_type(&self) -> &DataType; + + /// The validity of the [`Array`]: every array has an optional [`Bitmap`] that, when available + /// specifies whether the array slot is valid or not (null). + /// When the validity is [`None`], all slots are valid. + fn validity(&self) -> Option<&Bitmap>; + + /// The number of null slots on this [`Array`]. + /// # Implementation + /// This is `O(1)` since the number of null elements is pre-computed. + #[inline] + fn null_count(&self) -> usize { + if self.data_type() == &DataType::Null { + return self.len(); + }; + self.validity() + .as_ref() + .map(|x| x.unset_bits()) + .unwrap_or(0) + } + + /// Returns whether slot `i` is null. + /// # Panic + /// Panics iff `i >= self.len()`. + #[inline] + fn is_null(&self, i: usize) -> bool { + assert!(i < self.len()); + unsafe { self.is_null_unchecked(i) } + } + + /// Returns whether slot `i` is null. + /// # Safety + /// The caller must ensure `i < self.len()` + #[inline] + unsafe fn is_null_unchecked(&self, i: usize) -> bool { + self.validity() + .as_ref() + .map(|x| !x.get_bit_unchecked(i)) + .unwrap_or(false) + } + + /// Returns whether slot `i` is valid. + /// # Panic + /// Panics iff `i >= self.len()`. + #[inline] + fn is_valid(&self, i: usize) -> bool { + !self.is_null(i) + } + + /// Slices this [`Array`]. + /// # Implementation + /// This operation is `O(1)` over `len`. + /// # Panic + /// This function panics iff `offset + length > self.len()`. + fn slice(&mut self, offset: usize, length: usize); + + /// Slices the [`Array`]. + /// # Implementation + /// This operation is `O(1)`. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()` + unsafe fn slice_unchecked(&mut self, offset: usize, length: usize); + + /// Returns a slice of this [`Array`]. + /// # Implementation + /// This operation is `O(1)` over `len`. + /// # Panic + /// This function panics iff `offset + length > self.len()`. + #[must_use] + fn sliced(&self, offset: usize, length: usize) -> Box { + let mut new = self.to_boxed(); + new.slice(offset, length); + new + } + + /// Returns a slice of this [`Array`]. + /// # Implementation + /// This operation is `O(1)` over `len`, as it amounts to increase two ref counts + /// and moving the struct to the heap. 
+ /// # Safety + /// The caller must ensure that `offset + length <= self.len()` + #[must_use] + unsafe fn sliced_unchecked(&self, offset: usize, length: usize) -> Box { + let mut new = self.to_boxed(); + new.slice_unchecked(offset, length); + new + } + + /// Clones this [`Array`] with a new new assigned bitmap. + /// # Panic + /// This function panics iff `validity.len() != self.len()`. + fn with_validity(&self, validity: Option) -> Box; + + /// Clone a `&dyn Array` to an owned `Box`. + fn to_boxed(&self) -> Box; +} + +dyn_clone::clone_trait_object!(Array); + +/// A trait describing an array with a backing store that can be preallocated to +/// a given size. +pub(crate) trait Container { + /// Create this array with a given capacity. + fn with_capacity(capacity: usize) -> Self + where + Self: Sized; +} + +/// A trait describing a mutable array; i.e. an array whose values can be changed. +/// Mutable arrays cannot be cloned but can be mutated in place, +/// thereby making them useful to perform numeric operations without allocations. +/// As in [`Array`], concrete arrays (such as [`MutablePrimitiveArray`]) implement how they are mutated. +pub trait MutableArray: std::fmt::Debug + Send + Sync { + /// The [`DataType`] of the array. + fn data_type(&self) -> &DataType; + + /// The length of the array. + fn len(&self) -> usize; + + /// Whether the array is empty. + fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// The optional validity of the array. + fn validity(&self) -> Option<&MutableBitmap>; + + /// Convert itself to an (immutable) [`Array`]. + fn as_box(&mut self) -> Box; + + /// Convert itself to an (immutable) atomically reference counted [`Array`]. + // This provided implementation has an extra allocation as it first + // boxes `self`, then converts the box into an `Arc`. Implementors may wish + // to avoid an allocation by skipping the box completely. + fn as_arc(&mut self) -> std::sync::Arc { + self.as_box().into() + } + + /// Convert to `Any`, to enable dynamic casting. + fn as_any(&self) -> &dyn Any; + + /// Convert to mutable `Any`, to enable dynamic casting. + fn as_mut_any(&mut self) -> &mut dyn Any; + + /// Adds a new null element to the array. + fn push_null(&mut self); + + /// Whether `index` is valid / set. + /// # Panic + /// Panics if `index >= self.len()`. + #[inline] + fn is_valid(&self, index: usize) -> bool { + self.validity() + .as_ref() + .map(|x| x.get(index)) + .unwrap_or(true) + } + + /// Reserves additional slots to its capacity. + fn reserve(&mut self, additional: usize); + + /// Shrink the array to fit its length. + fn shrink_to_fit(&mut self); +} + +impl MutableArray for Box { + fn len(&self) -> usize { + self.as_ref().len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.as_ref().validity() + } + + fn as_box(&mut self) -> Box { + self.as_mut().as_box() + } + + fn as_arc(&mut self) -> Arc { + self.as_mut().as_arc() + } + + fn data_type(&self) -> &DataType { + self.as_ref().data_type() + } + + fn as_any(&self) -> &dyn std::any::Any { + self.as_ref().as_any() + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self.as_mut().as_mut_any() + } + + #[inline] + fn push_null(&mut self) { + self.as_mut().push_null() + } + + fn shrink_to_fit(&mut self) { + self.as_mut().shrink_to_fit(); + } + + fn reserve(&mut self, additional: usize) { + self.as_mut().reserve(additional); + } +} + +macro_rules! 
general_dyn { + ($array:expr, $ty:ty, $f:expr) => {{ + let array = $array.as_any().downcast_ref::<$ty>().unwrap(); + ($f)(array) + }}; +} + +macro_rules! fmt_dyn { + ($array:expr, $ty:ty, $f:expr) => {{ + let mut f = |x: &$ty| x.fmt($f); + general_dyn!($array, $ty, f) + }}; +} + +macro_rules! match_integer_type {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::IntegerType::*; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + } +})} + +macro_rules! with_match_primitive_type {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + use crate::types::{days_ms, months_days_ns, f16, i256}; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + Int256 => __with_ty__! { i256 }, + DaysMs => __with_ty__! { days_ms }, + MonthDayNano => __with_ty__! { months_days_ns }, + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + Float16 => __with_ty__! { f16 }, + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + } +})} + +impl std::fmt::Debug for dyn Array + '_ { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + use crate::datatypes::PhysicalType::*; + match self.data_type().to_physical_type() { + Null => fmt_dyn!(self, NullArray, f), + Boolean => fmt_dyn!(self, BooleanArray, f), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + fmt_dyn!(self, PrimitiveArray<$T>, f) + }), + Binary => fmt_dyn!(self, BinaryArray, f), + LargeBinary => fmt_dyn!(self, BinaryArray, f), + FixedSizeBinary => fmt_dyn!(self, FixedSizeBinaryArray, f), + Utf8 => fmt_dyn!(self, Utf8Array::, f), + LargeUtf8 => fmt_dyn!(self, Utf8Array::, f), + List => fmt_dyn!(self, ListArray::, f), + LargeList => fmt_dyn!(self, ListArray::, f), + FixedSizeList => fmt_dyn!(self, FixedSizeListArray, f), + Struct => fmt_dyn!(self, StructArray, f), + Union => fmt_dyn!(self, UnionArray, f), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + fmt_dyn!(self, DictionaryArray::<$T>, f) + }) + }, + Map => fmt_dyn!(self, MapArray, f), + } + } +} + +/// Creates a new [`Array`] with a [`Array::len`] of 0. 
+pub fn new_empty_array(data_type: DataType) -> Box { + use crate::datatypes::PhysicalType::*; + match data_type.to_physical_type() { + Null => Box::new(NullArray::new_empty(data_type)), + Boolean => Box::new(BooleanArray::new_empty(data_type)), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(PrimitiveArray::<$T>::new_empty(data_type)) + }), + Binary => Box::new(BinaryArray::::new_empty(data_type)), + LargeBinary => Box::new(BinaryArray::::new_empty(data_type)), + FixedSizeBinary => Box::new(FixedSizeBinaryArray::new_empty(data_type)), + Utf8 => Box::new(Utf8Array::::new_empty(data_type)), + LargeUtf8 => Box::new(Utf8Array::::new_empty(data_type)), + List => Box::new(ListArray::::new_empty(data_type)), + LargeList => Box::new(ListArray::::new_empty(data_type)), + FixedSizeList => Box::new(FixedSizeListArray::new_empty(data_type)), + Struct => Box::new(StructArray::new_empty(data_type)), + Union => Box::new(UnionArray::new_empty(data_type)), + Map => Box::new(MapArray::new_empty(data_type)), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + Box::new(DictionaryArray::<$T>::new_empty(data_type)) + }) + }, + } +} + +/// Creates a new [`Array`] of [`DataType`] `data_type` and `length`. +/// The array is guaranteed to have [`Array::null_count`] equal to [`Array::len`] +/// for all types except Union, which does not have a validity. +pub fn new_null_array(data_type: DataType, length: usize) -> Box { + use crate::datatypes::PhysicalType::*; + match data_type.to_physical_type() { + Null => Box::new(NullArray::new_null(data_type, length)), + Boolean => Box::new(BooleanArray::new_null(data_type, length)), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(PrimitiveArray::<$T>::new_null(data_type, length)) + }), + Binary => Box::new(BinaryArray::::new_null(data_type, length)), + LargeBinary => Box::new(BinaryArray::::new_null(data_type, length)), + FixedSizeBinary => Box::new(FixedSizeBinaryArray::new_null(data_type, length)), + Utf8 => Box::new(Utf8Array::::new_null(data_type, length)), + LargeUtf8 => Box::new(Utf8Array::::new_null(data_type, length)), + List => Box::new(ListArray::::new_null(data_type, length)), + LargeList => Box::new(ListArray::::new_null(data_type, length)), + FixedSizeList => Box::new(FixedSizeListArray::new_null(data_type, length)), + Struct => Box::new(StructArray::new_null(data_type, length)), + Union => Box::new(UnionArray::new_null(data_type, length)), + Map => Box::new(MapArray::new_null(data_type, length)), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + Box::new(DictionaryArray::<$T>::new_null(data_type, length)) + }) + }, + } +} + +/// Trait providing bi-directional conversion between arrow2 [`Array`] and arrow-rs [`ArrayData`] +/// +/// [`ArrayData`]: arrow_data::ArrayData +#[cfg(feature = "arrow")] +pub trait Arrow2Arrow: Array { + /// Convert this [`Array`] into [`ArrayData`] + fn to_data(&self) -> arrow_data::ArrayData; + + /// Create this [`Array`] from [`ArrayData`] + fn from_data(data: &arrow_data::ArrayData) -> Self; +} + +#[cfg(feature = "arrow")] +macro_rules! 
to_data_dyn { + ($array:expr, $ty:ty) => {{ + let f = |x: &$ty| x.to_data(); + general_dyn!($array, $ty, f) + }}; +} + +#[cfg(feature = "arrow")] +impl From> for arrow_array::ArrayRef { + fn from(value: Box) -> Self { + value.as_ref().into() + } +} + +#[cfg(feature = "arrow")] +impl From<&dyn Array> for arrow_array::ArrayRef { + fn from(value: &dyn Array) -> Self { + arrow_array::make_array(to_data(value)) + } +} + +#[cfg(feature = "arrow")] +impl From for Box { + fn from(value: arrow_array::ArrayRef) -> Self { + value.as_ref().into() + } +} + +#[cfg(feature = "arrow")] +impl From<&dyn arrow_array::Array> for Box { + fn from(value: &dyn arrow_array::Array) -> Self { + from_data(&value.to_data()) + } +} + +/// Convert an arrow2 [`Array`] to [`arrow_data::ArrayData`] +#[cfg(feature = "arrow")] +pub fn to_data(array: &dyn Array) -> arrow_data::ArrayData { + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Null => to_data_dyn!(array, NullArray), + Boolean => to_data_dyn!(array, BooleanArray), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + to_data_dyn!(array, PrimitiveArray<$T>) + }), + Binary => to_data_dyn!(array, BinaryArray), + LargeBinary => to_data_dyn!(array, BinaryArray), + FixedSizeBinary => to_data_dyn!(array, FixedSizeBinaryArray), + Utf8 => to_data_dyn!(array, Utf8Array::), + LargeUtf8 => to_data_dyn!(array, Utf8Array::), + List => to_data_dyn!(array, ListArray::), + LargeList => to_data_dyn!(array, ListArray::), + FixedSizeList => to_data_dyn!(array, FixedSizeListArray), + Struct => to_data_dyn!(array, StructArray), + Union => to_data_dyn!(array, UnionArray), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + to_data_dyn!(array, DictionaryArray::<$T>) + }) + }, + Map => to_data_dyn!(array, MapArray), + } +} + +/// Convert an [`arrow_data::ArrayData`] to arrow2 [`Array`] +#[cfg(feature = "arrow")] +pub fn from_data(data: &arrow_data::ArrayData) -> Box { + use crate::datatypes::PhysicalType::*; + let data_type: DataType = data.data_type().clone().into(); + match data_type.to_physical_type() { + Null => Box::new(NullArray::from_data(data)), + Boolean => Box::new(BooleanArray::from_data(data)), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(PrimitiveArray::<$T>::from_data(data)) + }), + Binary => Box::new(BinaryArray::::from_data(data)), + LargeBinary => Box::new(BinaryArray::::from_data(data)), + FixedSizeBinary => Box::new(FixedSizeBinaryArray::from_data(data)), + Utf8 => Box::new(Utf8Array::::from_data(data)), + LargeUtf8 => Box::new(Utf8Array::::from_data(data)), + List => Box::new(ListArray::::from_data(data)), + LargeList => Box::new(ListArray::::from_data(data)), + FixedSizeList => Box::new(FixedSizeListArray::from_data(data)), + Struct => Box::new(StructArray::from_data(data)), + Union => Box::new(UnionArray::from_data(data)), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + Box::new(DictionaryArray::<$T>::from_data(data)) + }) + }, + Map => Box::new(MapArray::from_data(data)), + } +} + +macro_rules! clone_dyn { + ($array:expr, $ty:ty) => {{ + let f = |x: &$ty| Box::new(x.clone()); + general_dyn!($array, $ty, f) + }}; +} + +// macro implementing `sliced` and `sliced_unchecked` +macro_rules! impl_sliced { + () => { + /// Returns this array sliced. + /// # Implementation + /// This function is `O(1)`. + /// # Panics + /// iff `offset + length > self.len()`. 
+ #[inline] + #[must_use] + pub fn sliced(self, offset: usize, length: usize) -> Self { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + unsafe { self.sliced_unchecked(offset, length) } + } + + /// Returns this array sliced. + /// # Implementation + /// This function is `O(1)`. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + #[inline] + #[must_use] + pub unsafe fn sliced_unchecked(mut self, offset: usize, length: usize) -> Self { + self.slice_unchecked(offset, length); + self + } + }; +} + +// macro implementing `with_validity` and `set_validity` +macro_rules! impl_mut_validity { + () => { + /// Returns this array with a new validity. + /// # Panic + /// Panics iff `validity.len() != self.len()`. + #[must_use] + #[inline] + pub fn with_validity(mut self, validity: Option) -> Self { + self.set_validity(validity); + self + } + + /// Sets the validity of this array. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + #[inline] + pub fn set_validity(&mut self, validity: Option) { + if matches!(&validity, Some(bitmap) if bitmap.len() != self.len()) { + panic!("validity must be equal to the array's length") + } + self.validity = validity; + } + } +} + +// macro implementing `with_validity`, `set_validity` and `apply_validity` for mutable arrays +macro_rules! impl_mutable_array_mut_validity { + () => { + /// Returns this array with a new validity. + /// # Panic + /// Panics iff `validity.len() != self.len()`. + #[must_use] + #[inline] + pub fn with_validity(mut self, validity: Option) -> Self { + self.set_validity(validity); + self + } + + /// Sets the validity of this array. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + #[inline] + pub fn set_validity(&mut self, validity: Option) { + if matches!(&validity, Some(bitmap) if bitmap.len() != self.len()) { + panic!("validity must be equal to the array's length") + } + self.validity = validity; + } + + /// Applies a function `f` to the validity of this array. + /// + /// This is an API to leverage clone-on-write + /// # Panics + /// This function panics if the function `f` modifies the length of the [`Bitmap`]. + #[inline] + pub fn apply_validity MutableBitmap>(&mut self, f: F) { + if let Some(validity) = std::mem::take(&mut self.validity) { + self.set_validity(Some(f(validity))) + } + } + + } +} + +// macro implementing `boxed` and `arced` +macro_rules! impl_into_array { + () => { + /// Boxes this array into a [`Box`]. + pub fn boxed(self) -> Box { + Box::new(self) + } + + /// Arcs this array into a [`std::sync::Arc`]. + pub fn arced(self) -> std::sync::Arc { + std::sync::Arc::new(self) + } + }; +} + +// macro implementing common methods of trait `Array` +macro_rules! impl_common_array { + () => { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn as_any_mut(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn len(&self) -> usize { + self.len() + } + + #[inline] + fn data_type(&self) -> &DataType { + &self.data_type + } + + #[inline] + fn slice(&mut self, offset: usize, length: usize) { + self.slice(offset, length); + } + + #[inline] + unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.slice_unchecked(offset, length); + } + + #[inline] + fn to_boxed(&self) -> Box { + Box::new(self.clone()) + } + }; +} + +/// Clones a dynamic [`Array`]. 
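+///
+/// A short usage sketch (the `nano_arrow` path is assumed):
+///
+/// ```ignore
+/// use nano_arrow::array::{clone, Array, PrimitiveArray};
+///
+/// let a = PrimitiveArray::<i64>::from_slice([1, 2, 3]);
+/// let b = clone(&a);
+/// assert_eq!(b.len(), a.len());
+/// ```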
+/// # Implementation +/// This operation is `O(1)` over `len`, as it amounts to increase two ref counts +/// and moving the concrete struct under a `Box`. +pub fn clone(array: &dyn Array) -> Box { + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Null => clone_dyn!(array, NullArray), + Boolean => clone_dyn!(array, BooleanArray), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + clone_dyn!(array, PrimitiveArray<$T>) + }), + Binary => clone_dyn!(array, BinaryArray), + LargeBinary => clone_dyn!(array, BinaryArray), + FixedSizeBinary => clone_dyn!(array, FixedSizeBinaryArray), + Utf8 => clone_dyn!(array, Utf8Array::), + LargeUtf8 => clone_dyn!(array, Utf8Array::), + List => clone_dyn!(array, ListArray::), + LargeList => clone_dyn!(array, ListArray::), + FixedSizeList => clone_dyn!(array, FixedSizeListArray), + Struct => clone_dyn!(array, StructArray), + Union => clone_dyn!(array, UnionArray), + Map => clone_dyn!(array, MapArray), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + clone_dyn!(array, DictionaryArray::<$T>) + }) + }, + } +} + +// see https://users.rust-lang.org/t/generic-for-dyn-a-or-box-dyn-a-or-arc-dyn-a/69430/3 +// for details +impl<'a> AsRef<(dyn Array + 'a)> for dyn Array { + fn as_ref(&self) -> &(dyn Array + 'a) { + self + } +} + +mod binary; +mod boolean; +mod dictionary; +mod fixed_size_binary; +mod fixed_size_list; +mod list; +mod map; +mod null; +mod primitive; +mod specification; +mod struct_; +mod union; +mod utf8; + +mod equal; +mod ffi; +mod fmt; +#[doc(hidden)] +pub mod indexable; +mod iterator; + +pub mod growable; +pub mod ord; + +pub use binary::{BinaryArray, BinaryValueIter, MutableBinaryArray, MutableBinaryValuesArray}; +pub use boolean::{BooleanArray, MutableBooleanArray}; +pub use dictionary::{DictionaryArray, DictionaryKey, MutableDictionaryArray}; +pub use equal::equal; +pub use fixed_size_binary::{FixedSizeBinaryArray, MutableFixedSizeBinaryArray}; +pub use fixed_size_list::{FixedSizeListArray, MutableFixedSizeListArray}; +pub use fmt::{get_display, get_value_display}; +pub(crate) use iterator::ArrayAccessor; +pub use iterator::ArrayValuesIter; +pub use list::{ListArray, ListValuesIter, MutableListArray}; +pub use map::MapArray; +pub use null::{MutableNullArray, NullArray}; +pub use primitive::*; +pub use struct_::{MutableStructArray, StructArray}; +pub use union::UnionArray; +pub use utf8::{MutableUtf8Array, MutableUtf8ValuesArray, Utf8Array, Utf8ValuesIter}; + +pub(crate) use self::ffi::{offset_buffers_children_dictionary, FromFfi, ToFfi}; + +/// A trait describing the ability of a struct to create itself from a iterator. +/// This is similar to [`Extend`], but accepted the creation to error. +pub trait TryExtend { + /// Fallible version of [`Extend::extend`]. + fn try_extend>(&mut self, iter: I) -> Result<()>; +} + +/// A trait describing the ability of a struct to receive new items. +pub trait TryPush { + /// Tries to push a new element. + fn try_push(&mut self, item: A) -> Result<()>; +} + +/// A trait describing the ability of a struct to receive new items. +pub trait PushUnchecked { + /// Push a new element that holds the invariants of the struct. + /// # Safety + /// The items must uphold the invariants of the struct + /// Read the specific implementation of the trait to understand what these are. + unsafe fn push_unchecked(&mut self, item: A); +} + +/// A trait describing the ability of a struct to extend from a reference of itself. 
+/// Specialization of [`TryExtend`]. +pub trait TryExtendFromSelf { + /// Tries to extend itself with elements from `other`, failing only on overflow. + fn try_extend_from_self(&mut self, other: &Self) -> Result<()>; +} + +/// Trait that [`BinaryArray`] and [`Utf8Array`] implement for the purposes of DRY. +/// # Safety +/// The implementer must ensure that +/// 1. `offsets.len() > 0` +/// 2. `offsets[i] >= offsets[i-1] for all i` +/// 3. `offsets[i] < values.len() for all i` +pub unsafe trait GenericBinaryArray: Array { + /// The values of the array + fn values(&self) -> &[u8]; + /// The offsets of the array + fn offsets(&self) -> &[O]; +} diff --git a/crates/nano-arrow/src/array/null.rs b/crates/nano-arrow/src/array/null.rs new file mode 100644 index 000000000000..0fb9dd6644bd --- /dev/null +++ b/crates/nano-arrow/src/array/null.rs @@ -0,0 +1,200 @@ +use std::any::Any; + +use crate::array::{Array, FromFfi, MutableArray, ToFfi}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Error; +use crate::ffi; + +/// The concrete [`Array`] of [`DataType::Null`]. +#[derive(Clone)] +pub struct NullArray { + data_type: DataType, + length: usize, +} + +impl NullArray { + /// Returns a new [`NullArray`]. + /// # Errors + /// This function errors iff: + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to [`crate::datatypes::PhysicalType::Null`]. + pub fn try_new(data_type: DataType, length: usize) -> Result { + if data_type.to_physical_type() != PhysicalType::Null { + return Err(Error::oos( + "NullArray can only be initialized with a DataType whose physical type is Boolean", + )); + } + + Ok(Self { data_type, length }) + } + + /// Returns a new [`NullArray`]. + /// # Panics + /// This function errors iff: + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to [`crate::datatypes::PhysicalType::Null`]. + pub fn new(data_type: DataType, length: usize) -> Self { + Self::try_new(data_type, length).unwrap() + } + + /// Returns a new empty [`NullArray`]. + pub fn new_empty(data_type: DataType) -> Self { + Self::new(data_type, 0) + } + + /// Returns a new [`NullArray`]. + pub fn new_null(data_type: DataType, length: usize) -> Self { + Self::new(data_type, length) + } + + impl_sliced!(); + impl_into_array!(); +} + +impl NullArray { + /// Returns a slice of the [`NullArray`]. + /// # Panic + /// This function panics iff `offset + length > self.len()`. + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new array cannot exceed the arrays' length" + ); + unsafe { self.slice_unchecked(offset, length) }; + } + + /// Returns a slice of the [`NullArray`]. + /// # Safety + /// The caller must ensure that `offset + length < self.len()`. + pub unsafe fn slice_unchecked(&mut self, _offset: usize, length: usize) { + self.length = length; + } + + #[inline] + fn len(&self) -> usize { + self.length + } +} + +impl Array for NullArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + None + } + + fn with_validity(&self, _: Option) -> Box { + panic!("cannot set validity of a null array") + } +} + +#[derive(Debug)] +/// A distinct type to disambiguate +/// clashing methods +pub struct MutableNullArray { + inner: NullArray, +} + +impl MutableNullArray { + /// Returns a new [`MutableNullArray`]. 
+ /// # Panics + /// This function errors iff: + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to [`crate::datatypes::PhysicalType::Null`]. + pub fn new(data_type: DataType, length: usize) -> Self { + let inner = NullArray::try_new(data_type, length).unwrap(); + Self { inner } + } +} + +impl From for NullArray { + fn from(value: MutableNullArray) -> Self { + value.inner + } +} + +impl MutableArray for MutableNullArray { + fn data_type(&self) -> &DataType { + &DataType::Null + } + + fn len(&self) -> usize { + self.inner.length + } + + fn validity(&self) -> Option<&MutableBitmap> { + None + } + + fn as_box(&mut self) -> Box { + self.inner.clone().boxed() + } + + fn as_any(&self) -> &dyn Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn Any { + self + } + + fn push_null(&mut self) { + self.inner.length += 1; + } + + fn reserve(&mut self, _additional: usize) { + // no-op + } + + fn shrink_to_fit(&mut self) { + // no-op + } +} + +impl std::fmt::Debug for NullArray { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "NullArray({})", self.len()) + } +} + +unsafe impl ToFfi for NullArray { + fn buffers(&self) -> Vec> { + // `None` is technically not required by the specification, but older C++ implementations require it, so leaving + // it here for backward compatibility + vec![None] + } + + fn offset(&self) -> Option { + Some(0) + } + + fn to_ffi_aligned(&self) -> Self { + self.clone() + } +} + +impl FromFfi for NullArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + Self::try_new(data_type, array.array().len()) + } +} + +#[cfg(feature = "arrow")] +mod arrow { + use arrow_data::{ArrayData, ArrayDataBuilder}; + + use super::*; + impl NullArray { + /// Convert this array into [`arrow_data::ArrayData`] + pub fn to_data(&self) -> ArrayData { + let builder = ArrayDataBuilder::new(arrow_schema::DataType::Null).len(self.len()); + + // Safety: safe by construction + unsafe { builder.build_unchecked() } + } + + /// Create this array from [`ArrayData`] + pub fn from_data(data: &ArrayData) -> Self { + Self::new(DataType::Null, data.len()) + } + } +} diff --git a/crates/nano-arrow/src/array/ord.rs b/crates/nano-arrow/src/array/ord.rs new file mode 100644 index 000000000000..914eff2639f8 --- /dev/null +++ b/crates/nano-arrow/src/array/ord.rs @@ -0,0 +1,245 @@ +//! Contains functions and function factories to order values within arrays. + +use std::cmp::Ordering; + +use crate::array::*; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::offset::Offset; +use crate::types::NativeType; + +/// Compare the values at two arbitrary indices in two arrays. 
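+///
+/// A comparator of this shape can be used, for example, to argsort indices across
+/// an array, as sketched below (the `nano_arrow` path is assumed; `build_compare`
+/// is defined further down in this module):
+///
+/// ```ignore
+/// use nano_arrow::array::ord::build_compare;
+/// use nano_arrow::array::PrimitiveArray;
+///
+/// let a = PrimitiveArray::<i32>::from_slice([3, 1, 2]);
+/// let cmp = build_compare(&a, &a).unwrap();
+/// let mut indices: Vec<usize> = (0..a.len()).collect();
+/// indices.sort_by(|&l, &r| cmp(l, r));
+/// assert_eq!(indices, vec![1, 2, 0]);
+/// ```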
+pub type DynComparator = Box Ordering + Send + Sync>; + +/// implements comparison using IEEE 754 total ordering for f32 +// Original implementation from https://doc.rust-lang.org/std/primitive.f32.html#method.total_cmp +// TODO to change to use std when it becomes stable +#[inline] +pub fn total_cmp_f32(l: &f32, r: &f32) -> std::cmp::Ordering { + let mut left = l.to_bits() as i32; + let mut right = r.to_bits() as i32; + + left ^= (((left >> 31) as u32) >> 1) as i32; + right ^= (((right >> 31) as u32) >> 1) as i32; + + left.cmp(&right) +} + +/// implements comparison using IEEE 754 total ordering for f64 +// Original implementation from https://doc.rust-lang.org/std/primitive.f64.html#method.total_cmp +// TODO to change to use std when it becomes stable +#[inline] +pub fn total_cmp_f64(l: &f64, r: &f64) -> std::cmp::Ordering { + let mut left = l.to_bits() as i64; + let mut right = r.to_bits() as i64; + + left ^= (((left >> 63) as u64) >> 1) as i64; + right ^= (((right >> 63) as u64) >> 1) as i64; + + left.cmp(&right) +} + +/// Total order of all native types whose Rust implementation +/// that support total order. +#[inline] +pub fn total_cmp(l: &T, r: &T) -> std::cmp::Ordering +where + T: NativeType + Ord, +{ + l.cmp(r) +} + +fn compare_primitives(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + Box::new(move |i, j| total_cmp(&left.value(i), &right.value(j))) +} + +fn compare_boolean(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::() + .unwrap() + .clone(); + Box::new(move |i, j| left.value(i).cmp(&right.value(j))) +} + +fn compare_f32(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + Box::new(move |i, j| total_cmp_f32(&left.value(i), &right.value(j))) +} + +fn compare_f64(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + Box::new(move |i, j| total_cmp_f64(&left.value(i), &right.value(j))) +} + +fn compare_string(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + Box::new(move |i, j| left.value(i).cmp(right.value(j))) +} + +fn compare_binary(left: &dyn Array, right: &dyn Array) -> DynComparator { + let left = left + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + let right = right + .as_any() + .downcast_ref::>() + .unwrap() + .clone(); + Box::new(move |i, j| left.value(i).cmp(right.value(j))) +} + +fn compare_dict(left: &DictionaryArray, right: &DictionaryArray) -> Result +where + K: DictionaryKey, +{ + let left_keys = left.keys().values().clone(); + let right_keys = right.keys().values().clone(); + + let comparator = build_compare(left.values().as_ref(), right.values().as_ref())?; + + Ok(Box::new(move |i: usize, j: usize| { + // safety: all dictionaries keys are guaranteed to be castable to usize + let key_left = unsafe { left_keys[i].as_usize() }; + let key_right = unsafe { right_keys[j].as_usize() }; + 
(comparator)(key_left, key_right) + })) +} + +macro_rules! dyn_dict { + ($key:ty, $lhs:expr, $rhs:expr) => {{ + let lhs = $lhs.as_any().downcast_ref().unwrap(); + let rhs = $rhs.as_any().downcast_ref().unwrap(); + compare_dict::<$key>(lhs, rhs)? + }}; +} + +/// returns a comparison function that compares values at two different slots +/// between two [`Array`]. +/// # Example +/// ``` +/// use arrow2::array::{ord::build_compare, PrimitiveArray}; +/// +/// # fn main() -> arrow2::error::Result<()> { +/// let array1 = PrimitiveArray::from_slice([1, 2]); +/// let array2 = PrimitiveArray::from_slice([3, 4]); +/// +/// let cmp = build_compare(&array1, &array2)?; +/// +/// // 1 (index 0 of array1) is smaller than 4 (index 1 of array2) +/// assert_eq!(std::cmp::Ordering::Less, (cmp)(0, 1)); +/// # Ok(()) +/// # } +/// ``` +/// # Error +/// The arrays' [`DataType`] must be equal and the types must have a natural order. +// This is a factory of comparisons. +pub fn build_compare(left: &dyn Array, right: &dyn Array) -> Result { + use DataType::*; + use IntervalUnit::*; + use TimeUnit::*; + Ok(match (left.data_type(), right.data_type()) { + (a, b) if a != b => { + return Err(Error::InvalidArgumentError( + "Can't compare arrays of different types".to_string(), + )); + }, + (Boolean, Boolean) => compare_boolean(left, right), + (UInt8, UInt8) => compare_primitives::(left, right), + (UInt16, UInt16) => compare_primitives::(left, right), + (UInt32, UInt32) => compare_primitives::(left, right), + (UInt64, UInt64) => compare_primitives::(left, right), + (Int8, Int8) => compare_primitives::(left, right), + (Int16, Int16) => compare_primitives::(left, right), + (Int32, Int32) + | (Date32, Date32) + | (Time32(Second), Time32(Second)) + | (Time32(Millisecond), Time32(Millisecond)) + | (Interval(YearMonth), Interval(YearMonth)) => compare_primitives::(left, right), + (Int64, Int64) + | (Date64, Date64) + | (Time64(Microsecond), Time64(Microsecond)) + | (Time64(Nanosecond), Time64(Nanosecond)) + | (Timestamp(Second, None), Timestamp(Second, None)) + | (Timestamp(Millisecond, None), Timestamp(Millisecond, None)) + | (Timestamp(Microsecond, None), Timestamp(Microsecond, None)) + | (Timestamp(Nanosecond, None), Timestamp(Nanosecond, None)) + | (Duration(Second), Duration(Second)) + | (Duration(Millisecond), Duration(Millisecond)) + | (Duration(Microsecond), Duration(Microsecond)) + | (Duration(Nanosecond), Duration(Nanosecond)) => compare_primitives::(left, right), + (Float32, Float32) => compare_f32(left, right), + (Float64, Float64) => compare_f64(left, right), + (Decimal(_, _), Decimal(_, _)) => compare_primitives::(left, right), + (Utf8, Utf8) => compare_string::(left, right), + (LargeUtf8, LargeUtf8) => compare_string::(left, right), + (Binary, Binary) => compare_binary::(left, right), + (LargeBinary, LargeBinary) => compare_binary::(left, right), + (Dictionary(key_type_lhs, ..), Dictionary(key_type_rhs, ..)) => { + match (key_type_lhs, key_type_rhs) { + (IntegerType::UInt8, IntegerType::UInt8) => dyn_dict!(u8, left, right), + (IntegerType::UInt16, IntegerType::UInt16) => dyn_dict!(u16, left, right), + (IntegerType::UInt32, IntegerType::UInt32) => dyn_dict!(u32, left, right), + (IntegerType::UInt64, IntegerType::UInt64) => dyn_dict!(u64, left, right), + (IntegerType::Int8, IntegerType::Int8) => dyn_dict!(i8, left, right), + (IntegerType::Int16, IntegerType::Int16) => dyn_dict!(i16, left, right), + (IntegerType::Int32, IntegerType::Int32) => dyn_dict!(i32, left, right), + (IntegerType::Int64, IntegerType::Int64) 
=> dyn_dict!(i64, left, right), + (lhs, _) => { + return Err(Error::InvalidArgumentError(format!( + "Dictionaries do not support keys of type {lhs:?}" + ))) + }, + } + }, + (lhs, _) => { + return Err(Error::InvalidArgumentError(format!( + "The data type type {lhs:?} has no natural order" + ))) + }, + }) +} diff --git a/crates/nano-arrow/src/array/physical_binary.rs b/crates/nano-arrow/src/array/physical_binary.rs new file mode 100644 index 000000000000..694e61a7ea63 --- /dev/null +++ b/crates/nano-arrow/src/array/physical_binary.rs @@ -0,0 +1,230 @@ +use crate::bitmap::MutableBitmap; +use crate::offset::{Offset, Offsets}; + +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +#[allow(clippy::type_complexity)] +pub(crate) unsafe fn try_trusted_len_unzip( + iterator: I, +) -> std::result::Result<(Option, Offsets, Vec), E> +where + O: Offset, + P: AsRef<[u8]>, + I: Iterator, E>>, +{ + let (_, upper) = iterator.size_hint(); + let len = upper.expect("trusted_len_unzip requires an upper limit"); + + let mut null = MutableBitmap::with_capacity(len); + let mut offsets = Vec::::with_capacity(len + 1); + let mut values = Vec::::new(); + + let mut length = O::default(); + let mut dst = offsets.as_mut_ptr(); + std::ptr::write(dst, length); + dst = dst.add(1); + for item in iterator { + if let Some(item) = item? { + null.push_unchecked(true); + let s = item.as_ref(); + length += O::from_usize(s.len()).unwrap(); + values.extend_from_slice(s); + } else { + null.push_unchecked(false); + }; + + std::ptr::write(dst, length); + dst = dst.add(1); + } + assert_eq!( + dst.offset_from(offsets.as_ptr()) as usize, + len + 1, + "Trusted iterator length was not accurately reported" + ); + offsets.set_len(len + 1); + + Ok((null.into(), Offsets::new_unchecked(offsets), values)) +} + +/// Creates [`MutableBitmap`] and two [`Vec`]s from an iterator of `Option`. +/// The first buffer corresponds to a offset buffer, the second one +/// corresponds to a values buffer. +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +pub(crate) unsafe fn trusted_len_unzip( + iterator: I, +) -> (Option, Offsets, Vec) +where + O: Offset, + P: AsRef<[u8]>, + I: Iterator>, +{ + let (_, upper) = iterator.size_hint(); + let len = upper.expect("trusted_len_unzip requires an upper limit"); + + let mut offsets = Offsets::::with_capacity(len); + let mut values = Vec::::new(); + let mut validity = MutableBitmap::new(); + + extend_from_trusted_len_iter(&mut offsets, &mut values, &mut validity, iterator); + + let validity = if validity.unset_bits() > 0 { + Some(validity) + } else { + None + }; + + (validity, offsets, values) +} + +/// Creates two [`Buffer`]s from an iterator of `&[u8]`. +/// The first buffer corresponds to a offset buffer, the second to a values buffer. +/// # Safety +/// The caller must ensure that `iterator` is [`TrustedLen`]. +#[inline] +pub(crate) unsafe fn trusted_len_values_iter(iterator: I) -> (Offsets, Vec) +where + O: Offset, + P: AsRef<[u8]>, + I: Iterator, +{ + let (_, upper) = iterator.size_hint(); + let len = upper.expect("trusted_len_unzip requires an upper limit"); + + let mut offsets = Offsets::::with_capacity(len); + let mut values = Vec::::new(); + + extend_from_trusted_len_values_iter(&mut offsets, &mut values, iterator); + + (offsets, values) +} + +// Populates `offsets` and `values` [`Vec`]s with information extracted +// from the incoming `iterator`. 
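// Example sketch (annotation, not part of the diff): the total_cmp_f32/total_cmp_f64
// helpers in ord.rs above implement IEEE 754 totalOrder by remapping the float's bit
// pattern so that a plain integer comparison gives the right answer; this is what lets
// NaN and signed zero sort deterministically inside build_compare. Expected behaviour,
// assuming the arrow2-style path shown in this crate's doc examples:
fn float_total_order_sketch() {
    use std::cmp::Ordering;

    use arrow2::array::ord::total_cmp_f32;

    assert_eq!(total_cmp_f32(&-0.0, &0.0), Ordering::Less); // -0.0 sorts before +0.0
    assert_eq!(total_cmp_f32(&1.0, &f32::NAN), Ordering::Less); // NaN sorts after all numbers
    assert_eq!(total_cmp_f32(&f32::NAN, &f32::NAN), Ordering::Equal); // and equals itself
}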
+// # Safety +// The caller must ensure the `iterator` is [`TrustedLen`] +#[inline] +pub(crate) unsafe fn extend_from_trusted_len_values_iter( + offsets: &mut Offsets, + values: &mut Vec, + iterator: I, +) where + O: Offset, + P: AsRef<[u8]>, + I: Iterator, +{ + let lengths = iterator.map(|item| { + let s = item.as_ref(); + // Push new entries for both `values` and `offsets` buffer + values.extend_from_slice(s); + s.len() + }); + offsets.try_extend_from_lengths(lengths).unwrap(); +} + +// Populates `offsets` and `values` [`Vec`]s with information extracted +// from the incoming `iterator`. +// the return value indicates how many items were added. +#[inline] +pub(crate) fn extend_from_values_iter( + offsets: &mut Offsets, + values: &mut Vec, + iterator: I, +) -> usize +where + O: Offset, + P: AsRef<[u8]>, + I: Iterator, +{ + let (size_hint, _) = iterator.size_hint(); + + offsets.reserve(size_hint); + + let start_index = offsets.len_proxy(); + + for item in iterator { + let bytes = item.as_ref(); + values.extend_from_slice(bytes); + offsets.try_push_usize(bytes.len()).unwrap(); + } + offsets.len_proxy() - start_index +} + +// Populates `offsets`, `values`, and `validity` [`Vec`]s with +// information extracted from the incoming `iterator`. +// +// # Safety +// The caller must ensure that `iterator` is [`TrustedLen`] +#[inline] +pub(crate) unsafe fn extend_from_trusted_len_iter( + offsets: &mut Offsets, + values: &mut Vec, + validity: &mut MutableBitmap, + iterator: I, +) where + O: Offset, + P: AsRef<[u8]>, + I: Iterator>, +{ + let (_, upper) = iterator.size_hint(); + let additional = upper.expect("extend_from_trusted_len_iter requires an upper limit"); + + offsets.reserve(additional); + validity.reserve(additional); + + let lengths = iterator.map(|item| { + if let Some(item) = item { + let bytes = item.as_ref(); + values.extend_from_slice(bytes); + validity.push_unchecked(true); + bytes.len() + } else { + validity.push_unchecked(false); + 0 + } + }); + offsets.try_extend_from_lengths(lengths).unwrap(); +} + +/// Creates two [`Vec`]s from an iterator of `&[u8]`. +/// The first buffer corresponds to a offset buffer, the second to a values buffer. 
+#[inline] +pub(crate) fn values_iter(iterator: I) -> (Offsets, Vec) +where + O: Offset, + P: AsRef<[u8]>, + I: Iterator, +{ + let (lower, _) = iterator.size_hint(); + + let mut offsets = Offsets::::with_capacity(lower); + let mut values = Vec::::new(); + + for item in iterator { + let s = item.as_ref(); + values.extend_from_slice(s); + offsets.try_push_usize(s.len()).unwrap(); + } + (offsets, values) +} + +/// Extends `validity` with all items from `other` +pub(crate) fn extend_validity( + length: usize, + validity: &mut Option, + other: &Option, +) { + if let Some(other) = other { + if let Some(validity) = validity { + let slice = other.as_slice(); + // safety: invariant offset + length <= slice.len() + unsafe { validity.extend_from_slice_unchecked(slice, 0, other.len()) } + } else { + let mut new_validity = MutableBitmap::from_len_set(length); + new_validity.extend_from_slice(other.as_slice(), 0, other.len()); + *validity = Some(new_validity); + } + } +} diff --git a/crates/nano-arrow/src/array/primitive/data.rs b/crates/nano-arrow/src/array/primitive/data.rs new file mode 100644 index 000000000000..d4879f796812 --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/data.rs @@ -0,0 +1,33 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{Arrow2Arrow, PrimitiveArray}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::types::NativeType; + +impl Arrow2Arrow for PrimitiveArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .buffers(vec![self.values.clone().into()]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + + let mut values: Buffer = data.buffers()[0].clone().into(); + values.slice(data.offset(), data.len()); + + Self { + data_type, + values, + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/primitive/ffi.rs b/crates/nano-arrow/src/array/primitive/ffi.rs new file mode 100644 index 000000000000..c74c157f750f --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/ffi.rs @@ -0,0 +1,56 @@ +use super::PrimitiveArray; +use crate::array::{FromFfi, ToFfi}; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; +use crate::types::NativeType; + +unsafe impl ToFfi for PrimitiveArray { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.values.as_ptr().cast::()), + ] + } + + fn offset(&self) -> Option { + let offset = self.values.offset(); + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.values.offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + values: self.values.clone(), + } + } +} + +impl FromFfi for PrimitiveArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let values = unsafe { array.buffer::(1) }?; + + Self::try_new(data_type, values, validity) + } +} diff --git 
a/crates/nano-arrow/src/array/primitive/fmt.rs b/crates/nano-arrow/src/array/primitive/fmt.rs new file mode 100644 index 000000000000..3743a16a188e --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/fmt.rs @@ -0,0 +1,149 @@ +#![allow(clippy::redundant_closure_call)] +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::PrimitiveArray; +use crate::array::fmt::write_vec; +use crate::array::Array; +use crate::datatypes::{IntervalUnit, TimeUnit}; +use crate::temporal_conversions; +use crate::types::{days_ms, i256, months_days_ns, NativeType}; + +macro_rules! dyn_primitive { + ($array:expr, $ty:ty, $expr:expr) => {{ + let array = ($array as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(move |f, index| write!(f, "{}", $expr(array.value(index)))) + }}; +} + +pub fn get_write_value<'a, T: NativeType, F: Write>( + array: &'a PrimitiveArray, +) -> Box Result + 'a> { + use crate::datatypes::DataType::*; + match array.data_type().to_logical_type() { + Int8 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Int16 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Int32 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Int64 => Box::new(|f, index| write!(f, "{}", array.value(index))), + UInt8 => Box::new(|f, index| write!(f, "{}", array.value(index))), + UInt16 => Box::new(|f, index| write!(f, "{}", array.value(index))), + UInt32 => Box::new(|f, index| write!(f, "{}", array.value(index))), + UInt64 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Float16 => unreachable!(), + Float32 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Float64 => Box::new(|f, index| write!(f, "{}", array.value(index))), + Date32 => { + dyn_primitive!(array, i32, temporal_conversions::date32_to_date) + }, + Date64 => { + dyn_primitive!(array, i64, temporal_conversions::date64_to_date) + }, + Time32(TimeUnit::Second) => { + dyn_primitive!(array, i32, temporal_conversions::time32s_to_time) + }, + Time32(TimeUnit::Millisecond) => { + dyn_primitive!(array, i32, temporal_conversions::time32ms_to_time) + }, + Time32(_) => unreachable!(), // remaining are not valid + Time64(TimeUnit::Microsecond) => { + dyn_primitive!(array, i64, temporal_conversions::time64us_to_time) + }, + Time64(TimeUnit::Nanosecond) => { + dyn_primitive!(array, i64, temporal_conversions::time64ns_to_time) + }, + Time64(_) => unreachable!(), // remaining are not valid + Timestamp(time_unit, tz) => { + if let Some(tz) = tz { + let timezone = temporal_conversions::parse_offset(tz); + match timezone { + Ok(timezone) => { + dyn_primitive!(array, i64, |time| { + temporal_conversions::timestamp_to_datetime(time, *time_unit, &timezone) + }) + }, + #[cfg(feature = "chrono-tz")] + Err(_) => { + let timezone = temporal_conversions::parse_offset_tz(tz); + match timezone { + Ok(timezone) => dyn_primitive!(array, i64, |time| { + temporal_conversions::timestamp_to_datetime( + time, *time_unit, &timezone, + ) + }), + Err(_) => { + let tz = tz.clone(); + Box::new(move |f, index| { + write!(f, "{} ({})", array.value(index), tz) + }) + }, + } + }, + #[cfg(not(feature = "chrono-tz"))] + _ => { + let tz = tz.clone(); + Box::new(move |f, index| write!(f, "{} ({})", array.value(index), tz)) + }, + } + } else { + dyn_primitive!(array, i64, |time| { + temporal_conversions::timestamp_to_naive_datetime(time, *time_unit) + }) + } + }, + Interval(IntervalUnit::YearMonth) => { + dyn_primitive!(array, i32, |x| format!("{x}m")) + }, + Interval(IntervalUnit::DayTime) => { + 
dyn_primitive!(array, days_ms, |x: days_ms| format!( + "{}d{}ms", + x.days(), + x.milliseconds() + )) + }, + Interval(IntervalUnit::MonthDayNano) => { + dyn_primitive!(array, months_days_ns, |x: months_days_ns| format!( + "{}m{}d{}ns", + x.months(), + x.days(), + x.ns() + )) + }, + Duration(TimeUnit::Second) => dyn_primitive!(array, i64, |x| format!("{x}s")), + Duration(TimeUnit::Millisecond) => dyn_primitive!(array, i64, |x| format!("{x}ms")), + Duration(TimeUnit::Microsecond) => dyn_primitive!(array, i64, |x| format!("{x}us")), + Duration(TimeUnit::Nanosecond) => dyn_primitive!(array, i64, |x| format!("{x}ns")), + Decimal(_, scale) => { + // The number 999.99 has a precision of 5 and scale of 2 + let scale = *scale as u32; + let factor = 10i128.pow(scale); + let display = move |x: i128| { + let base = x / factor; + let decimals = (x - base * factor).abs(); + format!("{base}.{decimals}") + }; + dyn_primitive!(array, i128, display) + }, + Decimal256(_, scale) => { + let scale = *scale as u32; + let factor = (ethnum::I256::ONE * 10).pow(scale); + let display = move |x: i256| { + let base = x.0 / factor; + let decimals = (x.0 - base * factor).abs(); + format!("{base}.{decimals}") + }; + dyn_primitive!(array, i256, display) + }, + _ => unreachable!(), + } +} + +impl Debug for PrimitiveArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = get_write_value(self); + + write!(f, "{:?}", self.data_type())?; + write_vec(f, &*writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/primitive/from_natural.rs b/crates/nano-arrow/src/array/primitive/from_natural.rs new file mode 100644 index 000000000000..0530c748af7e --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/from_natural.rs @@ -0,0 +1,16 @@ +use std::iter::FromIterator; + +use super::{MutablePrimitiveArray, PrimitiveArray}; +use crate::types::NativeType; + +impl]>> From

for PrimitiveArray { + fn from(slice: P) -> Self { + MutablePrimitiveArray::::from(slice).into() + } +} + +impl>> FromIterator for PrimitiveArray { + fn from_iter>(iter: I) -> Self { + MutablePrimitiveArray::::from_iter(iter).into() + } +} diff --git a/crates/nano-arrow/src/array/primitive/iterator.rs b/crates/nano-arrow/src/array/primitive/iterator.rs new file mode 100644 index 000000000000..9433979dad84 --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/iterator.rs @@ -0,0 +1,47 @@ +use super::{MutablePrimitiveArray, PrimitiveArray}; +use crate::array::MutableArray; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::IntoIter as BitmapIntoIter; +use crate::buffer::IntoIter; +use crate::types::NativeType; + +impl IntoIterator for PrimitiveArray { + type Item = Option; + type IntoIter = ZipValidity, BitmapIntoIter>; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + let (_, values, validity) = self.into_inner(); + let values = values.into_iter(); + let validity = + validity.and_then(|validity| (validity.unset_bits() > 0).then(|| validity.into_iter())); + ZipValidity::new(values, validity) + } +} + +impl<'a, T: NativeType> IntoIterator for &'a PrimitiveArray { + type Item = Option<&'a T>; + type IntoIter = ZipValidity<&'a T, std::slice::Iter<'a, T>, BitmapIter<'a>>; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a, T: NativeType> MutablePrimitiveArray { + /// Returns an iterator over `Option` + #[inline] + pub fn iter(&'a self) -> ZipValidity<&'a T, std::slice::Iter<'a, T>, BitmapIter<'a>> { + ZipValidity::new( + self.values().iter(), + self.validity().as_ref().map(|x| x.iter()), + ) + } + + /// Returns an iterator of `T` + #[inline] + pub fn values_iter(&'a self) -> std::slice::Iter<'a, T> { + self.values().iter() + } +} diff --git a/crates/nano-arrow/src/array/primitive/mod.rs b/crates/nano-arrow/src/array/primitive/mod.rs new file mode 100644 index 000000000000..a3f80a581210 --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/mod.rs @@ -0,0 +1,510 @@ +use either::Either; + +use super::Array; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::*; +use crate::error::Error; +use crate::trusted_len::TrustedLen; +use crate::types::{days_ms, f16, i256, months_days_ns, NativeType}; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod from_natural; +mod iterator; +pub use iterator::*; +mod mutable; +pub use mutable::*; + +/// A [`PrimitiveArray`] is Arrow's semantically equivalent of an immutable `Vec>` where +/// T is [`NativeType`] (e.g. [`i32`]). It implements [`Array`]. +/// +/// One way to think about a [`PrimitiveArray`] is `(DataType, Arc>, Option>>)` +/// where: +/// * the first item is the array's logical type +/// * the second is the immutable values +/// * the third is the immutable validity (whether a value is null or not as a bitmap). +/// +/// The size of this struct is `O(1)`, as all data is stored behind an [`std::sync::Arc`]. 
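// Example sketch (annotation, not part of the diff): the IntoIterator/values_iter APIs
// from primitive/iterator.rs above in practice. ZipValidity merges values with the
// validity bitmap, while values_iter exposes the raw physical slots; here the null slot
// holds 0 because the From impl routes through MutablePrimitiveArray, which writes
// T::default() for nulls. Paths are the assumed arrow2-style ones.
fn primitive_iteration_sketch() {
    use arrow2::array::PrimitiveArray;

    let array = PrimitiveArray::<i16>::from([Some(1), None, Some(3)]);

    // Owned iteration consumes the array and yields Option<i16>.
    let owned: Vec<Option<i16>> = array.clone().into_iter().collect();
    assert_eq!(owned, vec![Some(1), None, Some(3)]);

    // values_iter ignores the validity and yields every physical slot.
    assert_eq!(array.values_iter().copied().collect::<Vec<_>>(), vec![1, 0, 3]);
}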
+/// # Example +/// ``` +/// use arrow2::array::PrimitiveArray; +/// use arrow2::bitmap::Bitmap; +/// use arrow2::buffer::Buffer; +/// +/// let array = PrimitiveArray::from([Some(1i32), None, Some(10)]); +/// assert_eq!(array.value(0), 1); +/// assert_eq!(array.iter().collect::>(), vec![Some(&1i32), None, Some(&10)]); +/// assert_eq!(array.values_iter().copied().collect::>(), vec![1, 0, 10]); +/// // the underlying representation +/// assert_eq!(array.values(), &Buffer::from(vec![1i32, 0, 10])); +/// assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true]))); +/// +/// ``` +#[derive(Clone)] +pub struct PrimitiveArray { + data_type: DataType, + values: Buffer, + validity: Option, +} + +pub(super) fn check( + data_type: &DataType, + values: &[T], + validity_len: Option, +) -> Result<(), Error> { + if validity_len.map_or(false, |len| len != values.len()) { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != PhysicalType::Primitive(T::PRIMITIVE) { + return Err(Error::oos( + "PrimitiveArray can only be initialized with a DataType whose physical type is Primitive", + )); + } + Ok(()) +} + +impl PrimitiveArray { + /// The canonical method to create a [`PrimitiveArray`] out of its internal components. + /// # Implementation + /// This function is `O(1)`. + /// + /// # Errors + /// This function errors iff: + /// * The validity is not `None` and its length is different from `values`'s length + /// * The `data_type`'s [`PhysicalType`] is not equal to [`PhysicalType::Primitive(T::PRIMITIVE)`] + pub fn try_new( + data_type: DataType, + values: Buffer, + validity: Option, + ) -> Result { + check(&data_type, &values, validity.as_ref().map(|v| v.len()))?; + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Returns a new [`PrimitiveArray`] with a different logical type. + /// + /// This function is useful to assign a different [`DataType`] to the array. + /// Used to change the arrays' logical type (see example). + /// # Example + /// ``` + /// use arrow2::array::Int32Array; + /// use arrow2::datatypes::DataType; + /// + /// let array = Int32Array::from(&[Some(1), None, Some(2)]).to(DataType::Date32); + /// assert_eq!( + /// format!("{:?}", array), + /// "Date32[1970-01-02, None, 1970-01-03]" + /// ); + /// ``` + /// # Panics + /// Panics iff the `data_type`'s [`PhysicalType`] is not equal to [`PhysicalType::Primitive(T::PRIMITIVE)`] + #[inline] + #[must_use] + pub fn to(self, data_type: DataType) -> Self { + check( + &data_type, + &self.values, + self.validity.as_ref().map(|v| v.len()), + ) + .unwrap(); + Self { + data_type, + values: self.values, + validity: self.validity, + } + } + + /// Creates a (non-null) [`PrimitiveArray`] from a vector of values. + /// This function is `O(1)`. + /// # Examples + /// ``` + /// use arrow2::array::PrimitiveArray; + /// + /// let array = PrimitiveArray::from_vec(vec![1, 2, 3]); + /// assert_eq!(format!("{:?}", array), "Int32[1, 2, 3]"); + /// ``` + pub fn from_vec(values: Vec) -> Self { + Self::new(T::PRIMITIVE.into(), values.into(), None) + } + + /// Returns an iterator over the values and validity, `Option<&T>`. + #[inline] + pub fn iter(&self) -> ZipValidity<&T, std::slice::Iter, BitmapIter> { + ZipValidity::new_with_validity(self.values().iter(), self.validity()) + } + + /// Returns an iterator of the values, `&T`, ignoring the arrays' validity. 
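// Example sketch (annotation, not part of the diff): the two error cases that `check` /
// `try_new` above guard against, using the arrow2-style paths from this crate's doc examples.
fn primitive_try_new_sketch() {
    use arrow2::array::PrimitiveArray;
    use arrow2::bitmap::Bitmap;
    use arrow2::buffer::Buffer;
    use arrow2::datatypes::DataType;

    let values = Buffer::from(vec![1i32, 2, 3]);

    // The validity length must match the number of values...
    let validity = Some(Bitmap::from([true, false])); // length 2 != 3
    assert!(PrimitiveArray::try_new(DataType::Int32, values.clone(), validity).is_err());

    // ...and the logical type must map onto T's physical type.
    assert!(PrimitiveArray::<i32>::try_new(DataType::Utf8, values, None).is_err());
}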
+ #[inline] + pub fn values_iter(&self) -> std::slice::Iter { + self.values().iter() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() + } + + /// The values [`Buffer`]. + /// Values on null slots are undetermined (they can be anything). + #[inline] + pub fn values(&self) -> &Buffer { + &self.values + } + + /// Returns the optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Returns the arrays' [`DataType`]. + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } + + /// Returns the value at slot `i`. + /// + /// Equivalent to `self.values()[i]`. The value of a null slot is undetermined (it can be anything). + /// # Panic + /// This function panics iff `i >= self.len`. + #[inline] + pub fn value(&self, i: usize) -> T { + self.values[i] + } + + /// Returns the value at index `i`. + /// The value on null slots is undetermined (it can be anything). + /// # Safety + /// Caller must be sure that `i < self.len()` + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> T { + *self.values.get_unchecked(i) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } + + /// Slices this [`PrimitiveArray`] by an offset and length. + /// # Implementation + /// This operation is `O(1)`. + #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "offset + length may not exceed length of array" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`PrimitiveArray`] by an offset and length. + /// # Implementation + /// This operation is `O(1)`. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.values.slice_unchecked(offset, length); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); + + /// Returns this [`PrimitiveArray`] with new values. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + #[must_use] + pub fn with_values(mut self, values: Buffer) -> Self { + self.set_values(values); + self + } + + /// Update the values of this [`PrimitiveArray`]. + /// # Panics + /// This function panics iff `values.len() != self.len()`. + pub fn set_values(&mut self, values: Buffer) { + assert_eq!( + values.len(), + self.len(), + "values' length must be equal to this arrays' length" + ); + self.values = values; + } + + /// Applies a function `f` to the validity of this array. + /// + /// This is an API to leverage clone-on-write + /// # Panics + /// This function panics if the function `f` modifies the length of the [`Bitmap`]. + pub fn apply_validity Bitmap>(&mut self, f: F) { + if let Some(validity) = std::mem::take(&mut self.validity) { + self.set_validity(Some(f(validity))) + } + } + + /// Returns an option of a mutable reference to the values of this [`PrimitiveArray`]. 
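// Example sketch (annotation, not part of the diff): slicing is O(1) because it only
// moves the offsets of the shared values buffer and validity bitmap; `get` then consults
// the (sliced) validity before reading a value.
fn primitive_slice_sketch() {
    use arrow2::array::PrimitiveArray;

    let mut array = PrimitiveArray::from([Some(1i32), None, Some(3), Some(4)]);
    array.slice(1, 2);
    assert_eq!(array.len(), 2);
    assert_eq!(array.get(0), None); // the null at original index 1
    assert_eq!(array.get(1), Some(3));
}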
+ pub fn get_mut_values(&mut self) -> Option<&mut [T]> { + self.values.get_mut_slice() + } + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (DataType, Buffer, Option) { + let Self { + data_type, + values, + validity, + } = self; + (data_type, values, validity) + } + + /// Creates a `[PrimitiveArray]` from its internal representation. + /// This is the inverted from `[PrimitiveArray::into_inner]` + pub fn from_inner( + data_type: DataType, + values: Buffer, + validity: Option, + ) -> Result { + check(&data_type, &values, validity.as_ref().map(|v| v.len()))?; + Ok(unsafe { Self::from_inner_unchecked(data_type, values, validity) }) + } + + /// Creates a `[PrimitiveArray]` from its internal representation. + /// This is the inverted from `[PrimitiveArray::into_inner]` + /// + /// # Safety + /// Callers must ensure all invariants of this struct are upheld. + pub unsafe fn from_inner_unchecked( + data_type: DataType, + values: Buffer, + validity: Option, + ) -> Self { + Self { + data_type, + values, + validity, + } + } + + /// Try to convert this [`PrimitiveArray`] to a [`MutablePrimitiveArray`] via copy-on-write semantics. + /// + /// A [`PrimitiveArray`] is backed by a [`Buffer`] and [`Bitmap`] which are essentially `Arc>`. + /// This function returns a [`MutablePrimitiveArray`] (via [`std::sync::Arc::get_mut`]) iff both values + /// and validity have not been cloned / are unique references to their underlying vectors. + /// + /// This function is primarily used to re-use memory regions. + #[must_use] + pub fn into_mut(self) -> Either> { + use Either::*; + + if let Some(bitmap) = self.validity { + match bitmap.into_mut() { + Left(bitmap) => Left(PrimitiveArray::new( + self.data_type, + self.values, + Some(bitmap), + )), + Right(mutable_bitmap) => match self.values.into_mut() { + Right(values) => Right( + MutablePrimitiveArray::try_new( + self.data_type, + values, + Some(mutable_bitmap), + ) + .unwrap(), + ), + Left(values) => Left(PrimitiveArray::new( + self.data_type, + values, + Some(mutable_bitmap.into()), + )), + }, + } + } else { + match self.values.into_mut() { + Right(values) => { + Right(MutablePrimitiveArray::try_new(self.data_type, values, None).unwrap()) + }, + Left(values) => Left(PrimitiveArray::new(self.data_type, values, None)), + } + } + } + + /// Returns a new empty (zero-length) [`PrimitiveArray`]. + pub fn new_empty(data_type: DataType) -> Self { + Self::new(data_type, Buffer::new(), None) + } + + /// Returns a new [`PrimitiveArray`] where all slots are null / `None`. + #[inline] + pub fn new_null(data_type: DataType, length: usize) -> Self { + Self::new( + data_type, + vec![T::default(); length].into(), + Some(Bitmap::new_zeroed(length)), + ) + } + + /// Creates a (non-null) [`PrimitiveArray`] from an iterator of values. + /// # Implementation + /// This does not assume that the iterator has a known length. + pub fn from_values>(iter: I) -> Self { + Self::new(T::PRIMITIVE.into(), Vec::::from_iter(iter).into(), None) + } + + /// Creates a (non-null) [`PrimitiveArray`] from a slice of values. + /// # Implementation + /// This is essentially a memcopy and is thus `O(N)` + pub fn from_slice>(slice: P) -> Self { + Self::new( + T::PRIMITIVE.into(), + Vec::::from(slice.as_ref()).into(), + None, + ) + } + + /// Creates a (non-null) [`PrimitiveArray`] from a [`TrustedLen`] of values. + /// # Implementation + /// This does not assume that the iterator has a known length. 
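// Example sketch (annotation, not part of the diff): `into_mut` above hands back the
// mutable variant only when the underlying Buffer/Bitmap are not shared, which is what
// makes in-place reuse of allocations possible. `Either` comes from the `either` crate
// already in this workspace; paths are again the assumed arrow2-style ones.
fn primitive_into_mut_sketch() {
    use arrow2::array::PrimitiveArray;
    use either::Either;

    let array = PrimitiveArray::from_vec(vec![1i32, 2, 3]);
    // Freshly built, so the buffer should be uniquely owned and the Right variant returned.
    if let Either::Right(mut mutable) = array.into_mut() {
        mutable.push(Some(4)); // keeps reusing the original allocation
    }
}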
+ pub fn from_trusted_len_values_iter>(iter: I) -> Self { + MutablePrimitiveArray::::from_trusted_len_values_iter(iter).into() + } + + /// Creates a new [`PrimitiveArray`] from an iterator over values + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + pub unsafe fn from_trusted_len_values_iter_unchecked>(iter: I) -> Self { + MutablePrimitiveArray::::from_trusted_len_values_iter_unchecked(iter).into() + } + + /// Creates a [`PrimitiveArray`] from a [`TrustedLen`] of optional values. + pub fn from_trusted_len_iter>>(iter: I) -> Self { + MutablePrimitiveArray::::from_trusted_len_iter(iter).into() + } + + /// Creates a [`PrimitiveArray`] from an iterator of optional values. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + pub unsafe fn from_trusted_len_iter_unchecked>>(iter: I) -> Self { + MutablePrimitiveArray::::from_trusted_len_iter_unchecked(iter).into() + } + + /// Alias for `Self::try_new(..).unwrap()`. + /// # Panics + /// This function errors iff: + /// * The validity is not `None` and its length is different from `values`'s length + /// * The `data_type`'s [`PhysicalType`] is not equal to [`PhysicalType::Primitive`]. + pub fn new(data_type: DataType, values: Buffer, validity: Option) -> Self { + Self::try_new(data_type, values, validity).unwrap() + } +} + +impl Array for PrimitiveArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} + +/// A type definition [`PrimitiveArray`] for `i8` +pub type Int8Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `i16` +pub type Int16Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `i32` +pub type Int32Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `i64` +pub type Int64Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `i128` +pub type Int128Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `i256` +pub type Int256Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for [`days_ms`] +pub type DaysMsArray = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for [`months_days_ns`] +pub type MonthsDaysNsArray = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `f16` +pub type Float16Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `f32` +pub type Float32Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `f64` +pub type Float64Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `u8` +pub type UInt8Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `u16` +pub type UInt16Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `u32` +pub type UInt32Array = PrimitiveArray; +/// A type definition [`PrimitiveArray`] for `u64` +pub type UInt64Array = PrimitiveArray; + +/// A type definition [`MutablePrimitiveArray`] for `i8` +pub type Int8Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `i16` +pub type Int16Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `i32` +pub type Int32Vec = MutablePrimitiveArray; +/// A type definition 
[`MutablePrimitiveArray`] for `i64` +pub type Int64Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `i128` +pub type Int128Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `i256` +pub type Int256Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for [`days_ms`] +pub type DaysMsVec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for [`months_days_ns`] +pub type MonthsDaysNsVec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `f16` +pub type Float16Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `f32` +pub type Float32Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `f64` +pub type Float64Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `u8` +pub type UInt8Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `u16` +pub type UInt16Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `u32` +pub type UInt32Vec = MutablePrimitiveArray; +/// A type definition [`MutablePrimitiveArray`] for `u64` +pub type UInt64Vec = MutablePrimitiveArray; + +impl Default for PrimitiveArray { + fn default() -> Self { + PrimitiveArray::new(T::PRIMITIVE.into(), Default::default(), None) + } +} diff --git a/crates/nano-arrow/src/array/primitive/mutable.rs b/crates/nano-arrow/src/array/primitive/mutable.rs new file mode 100644 index 000000000000..fc61b2e74884 --- /dev/null +++ b/crates/nano-arrow/src/array/primitive/mutable.rs @@ -0,0 +1,665 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::{check, PrimitiveArray}; +use crate::array::physical_binary::extend_validity; +use crate::array::{Array, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::Error; +use crate::trusted_len::TrustedLen; +use crate::types::NativeType; + +/// The Arrow's equivalent to `Vec>` where `T` is byte-size (e.g. `i32`). +/// Converting a [`MutablePrimitiveArray`] into a [`PrimitiveArray`] is `O(1)`. +#[derive(Debug, Clone)] +pub struct MutablePrimitiveArray { + data_type: DataType, + values: Vec, + validity: Option, +} + +impl From> for PrimitiveArray { + fn from(other: MutablePrimitiveArray) -> Self { + let validity = other.validity.and_then(|x| { + let bitmap: Bitmap = x.into(); + if bitmap.unset_bits() == 0 { + None + } else { + Some(bitmap) + } + }); + + PrimitiveArray::::new(other.data_type, other.values.into(), validity) + } +} + +impl]>> From

for MutablePrimitiveArray { + fn from(slice: P) -> Self { + Self::from_trusted_len_iter(slice.as_ref().iter().map(|x| x.as_ref())) + } +} + +impl MutablePrimitiveArray { + /// Creates a new empty [`MutablePrimitiveArray`]. + pub fn new() -> Self { + Self::with_capacity(0) + } + + /// Creates a new [`MutablePrimitiveArray`] with a capacity. + pub fn with_capacity(capacity: usize) -> Self { + Self::with_capacity_from(capacity, T::PRIMITIVE.into()) + } + + /// The canonical method to create a [`MutablePrimitiveArray`] out of its internal components. + /// # Implementation + /// This function is `O(1)`. + /// + /// # Errors + /// This function errors iff: + /// * The validity is not `None` and its length is different from `values`'s length + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to [`crate::datatypes::PhysicalType::Primitive(T::PRIMITIVE)`] + pub fn try_new( + data_type: DataType, + values: Vec, + validity: Option, + ) -> Result { + check(&data_type, &values, validity.as_ref().map(|x| x.len()))?; + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Extract the low-end APIs from the [`MutablePrimitiveArray`]. + pub fn into_inner(self) -> (DataType, Vec, Option) { + (self.data_type, self.values, self.validity) + } + + /// Applies a function `f` to the values of this array, cloning the values + /// iff they are being shared with others + /// + /// This is an API to use clone-on-write + /// # Implementation + /// This function is `O(f)` if the data is not being shared, and `O(N) + O(f)` + /// if it is being shared (since it results in a `O(N)` memcopy). + /// # Panics + /// This function panics iff `f` panics + pub fn apply_values(&mut self, f: F) { + f(&mut self.values); + } +} + +impl Default for MutablePrimitiveArray { + fn default() -> Self { + Self::new() + } +} + +impl From for MutablePrimitiveArray { + fn from(data_type: DataType) -> Self { + assert!(data_type.to_physical_type().eq_primitive(T::PRIMITIVE)); + Self { + data_type, + values: Vec::::new(), + validity: None, + } + } +} + +impl MutablePrimitiveArray { + /// Creates a new [`MutablePrimitiveArray`] from a capacity and [`DataType`]. + pub fn with_capacity_from(capacity: usize, data_type: DataType) -> Self { + assert!(data_type.to_physical_type().eq_primitive(T::PRIMITIVE)); + Self { + data_type, + values: Vec::::with_capacity(capacity), + validity: None, + } + } + + /// Reserves `additional` entries. + pub fn reserve(&mut self, additional: usize) { + self.values.reserve(additional); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Adds a new value to the array. + #[inline] + pub fn push(&mut self, value: Option) { + match value { + Some(value) => { + self.values.push(value); + match &mut self.validity { + Some(validity) => validity.push(true), + None => {}, + } + }, + None => { + self.values.push(T::default()); + match &mut self.validity { + Some(validity) => validity.push(false), + None => { + self.init_validity(); + }, + } + }, + } + } + + /// Pop a value from the array. + /// Note if the values is empty, this method will return None. 
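// Example sketch (annotation, not part of the diff): `push` only allocates a validity
// bitmap once the first null arrives, and converting the mutable array into the immutable
// one is O(1) (the From impl even drops the bitmap again if no null survived).
fn mutable_push_sketch() {
    use arrow2::array::{MutableArray, MutablePrimitiveArray, PrimitiveArray};

    let mut mutable = MutablePrimitiveArray::<i32>::new();
    mutable.push(Some(1));
    mutable.push(None); // first null: the validity bitmap is initialized here
    mutable.push(Some(3));
    assert_eq!(mutable.len(), 3);

    let array: PrimitiveArray<i32> = mutable.into();
    assert_eq!(array.iter().collect::<Vec<_>>(), vec![Some(&1), None, Some(&3)]);
}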
+ pub fn pop(&mut self) -> Option { + let value = self.values.pop()?; + self.validity + .as_mut() + .map(|x| x.pop()?.then(|| value)) + .unwrap_or_else(|| Some(value)) + } + + /// Extends the [`MutablePrimitiveArray`] with a constant + #[inline] + pub fn extend_constant(&mut self, additional: usize, value: Option) { + if let Some(value) = value { + self.values.resize(self.values.len() + additional, value); + if let Some(validity) = &mut self.validity { + validity.extend_constant(additional, true) + } + } else { + if let Some(validity) = &mut self.validity { + validity.extend_constant(additional, false) + } else { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + validity.extend_constant(self.len(), true); + validity.extend_constant(additional, false); + self.validity = Some(validity) + } + self.values + .resize(self.values.len() + additional, T::default()); + } + } + + /// Extends the [`MutablePrimitiveArray`] from an iterator of trusted len. + #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: std::borrow::Borrow, + I: TrustedLen>, + { + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends the [`MutablePrimitiveArray`] from an iterator of trusted len. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: std::borrow::Borrow, + I: Iterator>, + { + if let Some(validity) = self.validity.as_mut() { + extend_trusted_len_unzip(iterator, validity, &mut self.values) + } else { + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + extend_trusted_len_unzip(iterator, &mut validity, &mut self.values); + self.validity = Some(validity); + } + } + /// Extends the [`MutablePrimitiveArray`] from an iterator of values of trusted len. + /// This differs from `extend_trusted_len` which accepts in iterator of optional values. + #[inline] + pub fn extend_trusted_len_values(&mut self, iterator: I) + where + I: TrustedLen, + { + unsafe { self.extend_trusted_len_values_unchecked(iterator) } + } + + /// Extends the [`MutablePrimitiveArray`] from an iterator of values of trusted len. + /// This differs from `extend_trusted_len_unchecked` which accepts in iterator of optional values. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_values_unchecked(&mut self, iterator: I) + where + I: Iterator, + { + self.values.extend(iterator); + self.update_all_valid(); + } + + #[inline] + /// Extends the [`MutablePrimitiveArray`] from a slice + pub fn extend_from_slice(&mut self, items: &[T]) { + self.values.extend_from_slice(items); + self.update_all_valid(); + } + + fn update_all_valid(&mut self) { + // get len before mutable borrow + let len = self.len(); + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(len - validity.len(), true); + } + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + validity.extend_constant(self.len(), true); + validity.set(self.len() - 1, false); + self.validity = Some(validity) + } + + /// Changes the arrays' [`DataType`], returning a new [`MutablePrimitiveArray`]. + /// Use to change the logical type without changing the corresponding physical Type. + /// # Implementation + /// This operation is `O(1)`. 
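// Example sketch (annotation, not part of the diff): the bulk `extend_*` methods above
// avoid per-item branching where they can, and `pop` reports a popped null slot as None.
fn mutable_extend_sketch() {
    use arrow2::array::{MutableArray, MutablePrimitiveArray};

    let mut mutable = MutablePrimitiveArray::<i64>::with_capacity(8);
    mutable.extend_from_slice(&[1, 2, 3]); // all valid, no bitmap allocated yet
    mutable.extend_constant(2, None);      // first nulls: the bitmap is created lazily
    mutable.extend_constant(1, Some(7));
    assert_eq!(mutable.len(), 6);
    assert_eq!(mutable.pop(), Some(7)); // a popped null would come back as None
}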
+ #[inline] + pub fn to(self, data_type: DataType) -> Self { + Self::try_new(data_type, self.values, self.validity).unwrap() + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: PrimitiveArray = self.into(); + Arc::new(a) + } + + /// Shrinks the capacity of the [`MutablePrimitiveArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } + + /// Returns the capacity of this [`MutablePrimitiveArray`]. + pub fn capacity(&self) -> usize { + self.values.capacity() + } +} + +/// Accessors +impl MutablePrimitiveArray { + /// Returns its values. + pub fn values(&self) -> &Vec { + &self.values + } + + /// Returns a mutable slice of values. + pub fn values_mut_slice(&mut self) -> &mut [T] { + self.values.as_mut_slice() + } +} + +/// Setters +impl MutablePrimitiveArray { + /// Sets position `index` to `value`. + /// Note that if it is the first time a null appears in this array, + /// this initializes the validity bitmap (`O(N)`). + /// # Panic + /// Panics iff index is larger than `self.len()`. + pub fn set(&mut self, index: usize, value: Option) { + assert!(index < self.len()); + // Safety: + // we just checked bounds + unsafe { self.set_unchecked(index, value) } + } + + /// Sets position `index` to `value`. + /// Note that if it is the first time a null appears in this array, + /// this initializes the validity bitmap (`O(N)`). + /// # Safety + /// Caller must ensure `index < self.len()` + pub unsafe fn set_unchecked(&mut self, index: usize, value: Option) { + *self.values.get_unchecked_mut(index) = value.unwrap_or_default(); + + if value.is_none() && self.validity.is_none() { + // When the validity is None, all elements so far are valid. When one of the elements is set of null, + // the validity must be initialized. + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + self.validity = Some(validity); + } + if let Some(x) = self.validity.as_mut() { + x.set_unchecked(index, value.is_some()) + } + } + + /// Sets the validity. + /// # Panic + /// Panics iff the validity's len is not equal to the existing values' length. + pub fn set_validity(&mut self, validity: Option) { + if let Some(validity) = &validity { + assert_eq!(self.values.len(), validity.len()) + } + self.validity = validity; + } + + /// Sets values. + /// # Panic + /// Panics iff the values' length is not equal to the existing validity's len. 
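// Example sketch (annotation, not part of the diff): `set` writes through to the values
// Vec and, like `push`, only materializes the validity bitmap (an O(N) step) the first
// time a null is written.
fn mutable_set_sketch() {
    use arrow2::array::MutablePrimitiveArray;

    let mut mutable = MutablePrimitiveArray::<i32>::new();
    mutable.extend_from_slice(&[10, 20, 30]);
    mutable.set(1, None); // first null: initializes the validity bitmap
    mutable.set(2, Some(99));
    assert_eq!(mutable.values(), &vec![10, 0, 99]); // the null slot holds T::default()
}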
+ pub fn set_values(&mut self, values: Vec) { + assert_eq!(values.len(), self.values.len()); + self.values = values; + } +} + +impl Extend> for MutablePrimitiveArray { + fn extend>>(&mut self, iter: I) { + let iter = iter.into_iter(); + self.reserve(iter.size_hint().0); + iter.for_each(|x| self.push(x)) + } +} + +impl TryExtend> for MutablePrimitiveArray { + /// This is infalible and is implemented for consistency with all other types + fn try_extend>>(&mut self, iter: I) -> Result<(), Error> { + self.extend(iter); + Ok(()) + } +} + +impl TryPush> for MutablePrimitiveArray { + /// This is infalible and is implemented for consistency with all other types + fn try_push(&mut self, item: Option) -> Result<(), Error> { + self.push(item); + Ok(()) + } +} + +impl MutableArray for MutablePrimitiveArray { + fn len(&self) -> usize { + self.values.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + PrimitiveArray::new( + self.data_type.clone(), + std::mem::take(&mut self.values).into(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> Arc { + PrimitiveArray::new( + self.data_type.clone(), + std::mem::take(&mut self.values).into(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + self.push(None) + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl MutablePrimitiveArray { + /// Creates a [`MutablePrimitiveArray`] from a slice of values. + pub fn from_slice>(slice: P) -> Self { + Self::from_trusted_len_values_iter(slice.as_ref().iter().copied()) + } + + /// Creates a [`MutablePrimitiveArray`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: Iterator>, + { + let (validity, values) = trusted_len_unzip(iterator); + + Self { + data_type: T::PRIMITIVE.into(), + values, + validity, + } + } + + /// Creates a [`MutablePrimitiveArray`] from a [`TrustedLen`]. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: std::borrow::Borrow, + I: TrustedLen>, + { + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a [`MutablePrimitiveArray`] from an fallible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked( + iter: I, + ) -> std::result::Result + where + P: std::borrow::Borrow, + I: IntoIterator, E>>, + { + let iterator = iter.into_iter(); + + let (validity, values) = try_trusted_len_unzip(iterator)?; + + Ok(Self { + data_type: T::PRIMITIVE.into(), + values, + validity, + }) + } + + /// Creates a [`MutablePrimitiveArray`] from an fallible iterator of trusted length. 
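// Example sketch (annotation, not part of the diff): the std `Extend`/`FromIterator`
// impls above make the mutable array usable in ordinary iterator pipelines, while
// `TryExtend`/`TryPush` exist mainly for API symmetry with fallible builders.
fn mutable_collect_sketch() {
    use arrow2::array::MutablePrimitiveArray;

    let mut mutable: MutablePrimitiveArray<i32> = vec![Some(1), None].into_iter().collect();
    mutable.extend(vec![Some(3), None]); // reserves from the size hint, then pushes
    assert_eq!(mutable.values(), &vec![1, 0, 3, 0]);
}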
+ #[inline] + pub fn try_from_trusted_len_iter(iterator: I) -> std::result::Result + where + P: std::borrow::Borrow, + I: TrustedLen, E>>, + { + unsafe { Self::try_from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a new [`MutablePrimitiveArray`] out an iterator over values + pub fn from_trusted_len_values_iter>(iter: I) -> Self { + Self { + data_type: T::PRIMITIVE.into(), + values: iter.collect(), + validity: None, + } + } + + /// Creates a (non-null) [`MutablePrimitiveArray`] from a vector of values. + /// This does not have memcopy and is the fastest way to create a [`PrimitiveArray`]. + pub fn from_vec(values: Vec) -> Self { + Self::try_new(T::PRIMITIVE.into(), values, None).unwrap() + } + + /// Creates a new [`MutablePrimitiveArray`] from an iterator over values + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + pub unsafe fn from_trusted_len_values_iter_unchecked>(iter: I) -> Self { + Self { + data_type: T::PRIMITIVE.into(), + values: iter.collect(), + validity: None, + } + } +} + +impl>> FromIterator + for MutablePrimitiveArray +{ + fn from_iter>(iter: I) -> Self { + let iter = iter.into_iter(); + let (lower, _) = iter.size_hint(); + + let mut validity = MutableBitmap::with_capacity(lower); + + let values: Vec = iter + .map(|item| { + if let Some(a) = item.borrow() { + validity.push(true); + *a + } else { + validity.push(false); + T::default() + } + }) + .collect(); + + let validity = Some(validity); + + Self { + data_type: T::PRIMITIVE.into(), + values, + validity, + } + } +} + +/// Extends a [`MutableBitmap`] and a [`Vec`] from an iterator of `Option`. +/// The first buffer corresponds to a bitmap buffer, the second one +/// corresponds to a values buffer. +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +pub(crate) unsafe fn extend_trusted_len_unzip( + iterator: I, + validity: &mut MutableBitmap, + buffer: &mut Vec, +) where + T: NativeType, + P: std::borrow::Borrow, + I: Iterator>, +{ + let (_, upper) = iterator.size_hint(); + let additional = upper.expect("trusted_len_unzip requires an upper limit"); + + validity.reserve(additional); + let values = iterator.map(|item| { + if let Some(item) = item { + validity.push_unchecked(true); + *item.borrow() + } else { + validity.push_unchecked(false); + T::default() + } + }); + buffer.extend(values); +} + +/// Creates a [`MutableBitmap`] and a [`Vec`] from an iterator of `Option`. +/// The first buffer corresponds to a bitmap buffer, the second one +/// corresponds to a values buffer. +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. +#[inline] +pub(crate) unsafe fn trusted_len_unzip(iterator: I) -> (Option, Vec) +where + T: NativeType, + P: std::borrow::Borrow, + I: Iterator>, +{ + let mut validity = MutableBitmap::new(); + let mut buffer = Vec::::new(); + + extend_trusted_len_unzip(iterator, &mut validity, &mut buffer); + + let validity = Some(validity); + + (validity, buffer) +} + +/// # Safety +/// The caller must ensure that `iterator` is `TrustedLen`. 
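// Example sketch (annotation, not part of the diff): `from_vec` takes ownership of the
// Vec, so building the mutable array and freezing it into a PrimitiveArray are both
// copy-free.
fn from_vec_sketch() {
    use arrow2::array::{MutablePrimitiveArray, PrimitiveArray};
    use arrow2::buffer::Buffer;

    let mutable = MutablePrimitiveArray::<f64>::from_vec(vec![1.0, 2.0, 3.0]);
    let array: PrimitiveArray<f64> = mutable.into(); // O(1), no memcopy
    assert_eq!(array.values(), &Buffer::from(vec![1.0, 2.0, 3.0]));
}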
+#[inline] +pub(crate) unsafe fn try_trusted_len_unzip( + iterator: I, +) -> std::result::Result<(Option, Vec), E> +where + T: NativeType, + P: std::borrow::Borrow, + I: Iterator, E>>, +{ + let (_, upper) = iterator.size_hint(); + let len = upper.expect("trusted_len_unzip requires an upper limit"); + + let mut null = MutableBitmap::with_capacity(len); + let mut buffer = Vec::::with_capacity(len); + + let mut dst = buffer.as_mut_ptr(); + for item in iterator { + let item = if let Some(item) = item? { + null.push(true); + *item.borrow() + } else { + null.push(false); + T::default() + }; + std::ptr::write(dst, item); + dst = dst.add(1); + } + assert_eq!( + dst.offset_from(buffer.as_ptr()) as usize, + len, + "Trusted iterator length was not accurately reported" + ); + buffer.set_len(len); + null.set_len(len); + + let validity = Some(null); + + Ok((validity, buffer)) +} + +impl PartialEq for MutablePrimitiveArray { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl TryExtendFromSelf for MutablePrimitiveArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<(), Error> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + let slice = other.values.as_slice(); + self.values.extend_from_slice(slice); + Ok(()) + } +} diff --git a/crates/nano-arrow/src/array/specification.rs b/crates/nano-arrow/src/array/specification.rs new file mode 100644 index 000000000000..efa8fe1be4a4 --- /dev/null +++ b/crates/nano-arrow/src/array/specification.rs @@ -0,0 +1,178 @@ +use crate::array::DictionaryKey; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets, OffsetsBuffer}; + +/// Helper trait to support `Offset` and `OffsetBuffer` +pub(crate) trait OffsetsContainer { + fn last(&self) -> usize; + fn as_slice(&self) -> &[O]; +} + +impl OffsetsContainer for OffsetsBuffer { + #[inline] + fn last(&self) -> usize { + self.last().to_usize() + } + + #[inline] + fn as_slice(&self) -> &[O] { + self.buffer() + } +} + +impl OffsetsContainer for Offsets { + #[inline] + fn last(&self) -> usize { + self.last().to_usize() + } + + #[inline] + fn as_slice(&self) -> &[O] { + self.as_slice() + } +} + +pub(crate) fn try_check_offsets_bounds>( + offsets: &C, + values_len: usize, +) -> Result<()> { + if offsets.last() > values_len { + Err(Error::oos("offsets must not exceed the values length")) + } else { + Ok(()) + } +} + +/// # Error +/// * any offset is larger or equal to `values_len`. 
+/// * any slice of `values` between two consecutive pairs from `offsets` is invalid `utf8`, or +pub(crate) fn try_check_utf8>( + offsets: &C, + values: &[u8], +) -> Result<()> { + if offsets.as_slice().len() == 1 { + return Ok(()); + } + + try_check_offsets_bounds(offsets, values.len())?; + + if values.is_ascii() { + Ok(()) + } else { + simdutf8::basic::from_utf8(values)?; + + // offsets can be == values.len() + // find first offset from the end that is smaller + // Example: + // values.len() = 10 + // offsets = [0, 5, 10, 10] + let offsets = offsets.as_slice(); + let last = offsets + .iter() + .enumerate() + .skip(1) + .rev() + .find_map(|(i, offset)| (offset.to_usize() < values.len()).then(|| i)); + + let last = if let Some(last) = last { + // following the example: last = 1 (offset = 5) + last + } else { + // given `l = values.len()`, this branch is hit iff either: + // * `offsets = [0, l, l, ...]`, which was covered by `from_utf8(values)` above + // * `offsets = [0]`, which never happens because offsets.as_slice().len() == 1 is short-circuited above + return Ok(()); + }; + + // truncate to relevant offsets. Note: `=last` because last was computed skipping the first item + // following the example: starts = [0, 5] + let starts = unsafe { offsets.get_unchecked(..=last) }; + + let mut any_invalid = false; + for start in starts { + let start = start.to_usize(); + + // Safety: `try_check_offsets_bounds` just checked for bounds + let b = *unsafe { values.get_unchecked(start) }; + + // A valid code-point iff it does not start with 0b10xxxxxx + // Bit-magic taken from `std::str::is_char_boundary` + if (b as i8) < -0x40 { + any_invalid = true + } + } + if any_invalid { + return Err(Error::oos("Non-valid char boundary detected")); + } + Ok(()) + } +} + +/// Check dictionary indexes without checking usize conversion. +/// # Safety +/// The caller must ensure that `K::as_usize` always succeeds. +pub(crate) unsafe fn check_indexes_unchecked( + keys: &[K], + len: usize, +) -> Result<()> { + let mut invalid = false; + + // this loop is auto-vectorized + keys.iter().for_each(|k| { + if k.as_usize() > len { + invalid = true; + } + }); + + if invalid { + let key = keys.iter().map(|k| k.as_usize()).max().unwrap(); + Err(Error::oos(format!("One of the dictionary keys is {key} but it must be < than the length of the dictionary values, which is {len}"))) + } else { + Ok(()) + } +} + +pub fn check_indexes(keys: &[K], len: usize) -> Result<()> +where + K: std::fmt::Debug + Copy + TryInto, +{ + keys.iter().try_for_each(|key| { + let key: usize = (*key) + .try_into() + .map_err(|_| Error::oos(format!("The dictionary key must fit in a `usize`, but {key:?} does not")))?; + if key >= len { + Err(Error::oos(format!("One of the dictionary keys is {key} but it must be < than the length of the dictionary values, which is {len}"))) + } else { + Ok(()) + } + }) +} + +#[cfg(test)] +mod tests { + use proptest::prelude::*; + + use super::*; + + pub(crate) fn binary_strategy() -> impl Strategy> { + prop::collection::vec(any::(), 1..100) + } + + proptest! 
{ + // a bit expensive, feel free to run it when changing the code above + // #![proptest_config(ProptestConfig::with_cases(100000))] + #[test] + #[cfg_attr(miri, ignore)] // miri and proptest do not work well + fn check_utf8_validation(values in binary_strategy()) { + + for offset in 0..values.len() - 1 { + let offsets = vec![0, offset as i32, values.len() as i32].try_into().unwrap(); + + let mut is_valid = std::str::from_utf8(&values[..offset]).is_ok(); + is_valid &= std::str::from_utf8(&values[offset..]).is_ok(); + + assert_eq!(try_check_utf8::>(&offsets, &values).is_ok(), is_valid) + } + } + } +} diff --git a/crates/nano-arrow/src/array/struct_/data.rs b/crates/nano-arrow/src/array/struct_/data.rs new file mode 100644 index 000000000000..b96dc4ffe28b --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/data.rs @@ -0,0 +1,28 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{from_data, to_data, Arrow2Arrow, StructArray}; +use crate::bitmap::Bitmap; + +impl Arrow2Arrow for StructArray { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type.clone().into(); + + let builder = ArrayDataBuilder::new(data_type) + .len(self.len()) + .nulls(self.validity.as_ref().map(|b| b.clone().into())) + .child_data(self.values.iter().map(|x| to_data(x.as_ref())).collect()); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + + Self { + data_type, + values: data.child_data().iter().map(from_data).collect(), + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/struct_/ffi.rs b/crates/nano-arrow/src/array/struct_/ffi.rs new file mode 100644 index 000000000000..95abe00694b2 --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/ffi.rs @@ -0,0 +1,72 @@ +use super::super::ffi::ToFfi; +use super::super::{Array, FromFfi}; +use super::StructArray; +use crate::error::Result; +use crate::ffi; + +unsafe impl ToFfi for StructArray { + fn buffers(&self) -> Vec> { + vec![self.validity.as_ref().map(|x| x.as_ptr())] + } + + fn children(&self) -> Vec> { + self.values.clone() + } + + fn offset(&self) -> Option { + Some( + self.validity + .as_ref() + .map(|bitmap| bitmap.offset()) + .unwrap_or_default(), + ) + } + + fn to_ffi_aligned(&self) -> Self { + self.clone() + } +} + +impl FromFfi for StructArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let fields = Self::get_fields(&data_type); + + let arrow_array = array.array(); + let validity = unsafe { array.validity() }?; + let len = arrow_array.len(); + let offset = arrow_array.offset(); + let values = (0..fields.len()) + .map(|index| { + let child = array.child(index)?; + ffi::try_from(child).map(|arr| { + // there is a discrepancy with how arrow2 exports sliced + // struct array and how pyarrow does it. 
+ // # Pyarrow + // ## struct array len 3 + // * slice 1 by with len 2 + // offset on struct array: 1 + // length on struct array: 2 + // offset on value array: 0 + // length on value array: 3 + // # Arrow2 + // ## struct array len 3 + // * slice 1 by with len 2 + // offset on struct array: 0 + // length on struct array: 3 + // offset on value array: 1 + // length on value array: 2 + // + // this branch will ensure both can round trip + if arr.len() >= (len + offset) { + arr.sliced(offset, len) + } else { + arr + } + }) + }) + .collect::>>>()?; + + Self::try_new(data_type, values, validity) + } +} diff --git a/crates/nano-arrow/src/array/struct_/fmt.rs b/crates/nano-arrow/src/array/struct_/fmt.rs new file mode 100644 index 000000000000..999cd8b67e08 --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/fmt.rs @@ -0,0 +1,34 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_map, write_vec}; +use super::StructArray; + +pub fn write_value( + array: &StructArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let writer = |f: &mut W, _index| { + for (i, (field, column)) in array.fields().iter().zip(array.values()).enumerate() { + if i != 0 { + write!(f, ", ")?; + } + let writer = get_display(column.as_ref(), null); + write!(f, "{}: ", field.name)?; + writer(f, index)?; + } + Ok(()) + }; + + write_map(f, writer, None, 1, null, false) +} + +impl Debug for StructArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + write!(f, "StructArray")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/struct_/iterator.rs b/crates/nano-arrow/src/array/struct_/iterator.rs new file mode 100644 index 000000000000..cb8e6aafbb09 --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/iterator.rs @@ -0,0 +1,96 @@ +use super::StructArray; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::scalar::{new_scalar, Scalar}; +use crate::trusted_len::TrustedLen; + +pub struct StructValueIter<'a> { + array: &'a StructArray, + index: usize, + end: usize, +} + +impl<'a> StructValueIter<'a> { + #[inline] + pub fn new(array: &'a StructArray) -> Self { + Self { + array, + index: 0, + end: array.len(), + } + } +} + +impl<'a> Iterator for StructValueIter<'a> { + type Item = Vec>; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + + // Safety: + // self.end is maximized by the length of the array + Some( + self.array + .values() + .iter() + .map(|v| new_scalar(v.as_ref(), old)) + .collect(), + ) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } +} + +unsafe impl<'a> TrustedLen for StructValueIter<'a> {} + +impl<'a> DoubleEndedIterator for StructValueIter<'a> { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + + // Safety: + // self.end is maximized by the length of the array + Some( + self.array + .values() + .iter() + .map(|v| new_scalar(v.as_ref(), self.end)) + .collect(), + ) + } + } +} + +type ValuesIter<'a> = StructValueIter<'a>; +type ZipIter<'a> = ZipValidity>, ValuesIter<'a>, BitmapIter<'a>>; + +impl<'a> IntoIterator for &'a StructArray { + type Item = Option>>; + type IntoIter = ZipIter<'a>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> 
StructArray { + /// Returns an iterator of `Option>` + pub fn iter(&'a self) -> ZipIter<'a> { + ZipValidity::new_with_validity(StructValueIter::new(self), self.validity()) + } + + /// Returns an iterator of `Box` + pub fn values_iter(&'a self) -> ValuesIter<'a> { + StructValueIter::new(self) + } +} diff --git a/crates/nano-arrow/src/array/struct_/mod.rs b/crates/nano-arrow/src/array/struct_/mod.rs new file mode 100644 index 000000000000..e38597036574 --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/mod.rs @@ -0,0 +1,254 @@ +use super::{new_empty_array, new_null_array, Array}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; +mod mutable; +pub use mutable::*; + +/// A [`StructArray`] is a nested [`Array`] with an optional validity representing +/// multiple [`Array`] with the same number of rows. +/// # Example +/// ``` +/// use arrow2::array::*; +/// use arrow2::datatypes::*; +/// let boolean = BooleanArray::from_slice(&[false, false, true, true]).boxed(); +/// let int = Int32Array::from_slice(&[42, 28, 19, 31]).boxed(); +/// +/// let fields = vec![ +/// Field::new("b", DataType::Boolean, false), +/// Field::new("c", DataType::Int32, false), +/// ]; +/// +/// let array = StructArray::new(DataType::Struct(fields), vec![boolean, int], None); +/// ``` +#[derive(Clone)] +pub struct StructArray { + data_type: DataType, + values: Vec>, + validity: Option, +} + +impl StructArray { + /// Returns a new [`StructArray`]. + /// # Errors + /// This function errors iff: + /// * `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Struct`]. + /// * the children of `data_type` are empty + /// * the values's len is different from children's length + /// * any of the values's data type is different from its corresponding children' data type + /// * any element of values has a different length than the first element + /// * the validity's length is not equal to the length of the first element + pub fn try_new( + data_type: DataType, + values: Vec>, + validity: Option, + ) -> Result { + let fields = Self::try_get_fields(&data_type)?; + if fields.is_empty() { + return Err(Error::oos("A StructArray must contain at least one field")); + } + if fields.len() != values.len() { + return Err(Error::oos( + "A StructArray must have a number of fields in its DataType equal to the number of child values", + )); + } + + fields + .iter().map(|a| &a.data_type) + .zip(values.iter().map(|a| a.data_type())) + .enumerate() + .try_for_each(|(index, (data_type, child))| { + if data_type != child { + Err(Error::oos(format!( + "The children DataTypes of a StructArray must equal the children data types. + However, the field {index} has data type {data_type:?} but the value has data type {child:?}" + ))) + } else { + Ok(()) + } + })?; + + let len = values[0].len(); + values + .iter() + .map(|a| a.len()) + .enumerate() + .try_for_each(|(index, a_len)| { + if a_len != len { + Err(Error::oos(format!( + "The children must have an equal number of values. + However, the values at index {index} have a length of {a_len}, which is different from values at index 0, {len}." 
+ ))) + } else { + Ok(()) + } + })?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != len) + { + return Err(Error::oos( + "The validity length of a StructArray must match its number of elements", + )); + } + + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Returns a new [`StructArray`] + /// # Panics + /// This function panics iff: + /// * `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Struct`]. + /// * the children of `data_type` are empty + /// * the values's len is different from children's length + /// * any of the values's data type is different from its corresponding children' data type + /// * any element of values has a different length than the first element + /// * the validity's length is not equal to the length of the first element + pub fn new(data_type: DataType, values: Vec>, validity: Option) -> Self { + Self::try_new(data_type, values, validity).unwrap() + } + + /// Creates an empty [`StructArray`]. + pub fn new_empty(data_type: DataType) -> Self { + if let DataType::Struct(fields) = &data_type.to_logical_type() { + let values = fields + .iter() + .map(|field| new_empty_array(field.data_type().clone())) + .collect(); + Self::new(data_type, values, None) + } else { + panic!("StructArray must be initialized with DataType::Struct"); + } + } + + /// Creates a null [`StructArray`] of length `length`. + pub fn new_null(data_type: DataType, length: usize) -> Self { + if let DataType::Struct(fields) = &data_type { + let values = fields + .iter() + .map(|field| new_null_array(field.data_type().clone(), length)) + .collect(); + Self::new(data_type, values, Some(Bitmap::new_zeroed(length))) + } else { + panic!("StructArray must be initialized with DataType::Struct"); + } + } +} + +// must use +impl StructArray { + /// Deconstructs the [`StructArray`] into its individual components. + #[must_use] + pub fn into_data(self) -> (Vec, Vec>, Option) { + let Self { + data_type, + values, + validity, + } = self; + let fields = if let DataType::Struct(fields) = data_type { + fields + } else { + unreachable!() + }; + (fields, values, validity) + } + + /// Slices this [`StructArray`]. + /// # Panics + /// * `offset + length` must be smaller than `self.len()`. + /// # Implementation + /// This operation is `O(F)` where `F` is the number of fields. + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "offset + length may not exceed length of array" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`StructArray`]. + /// # Implementation + /// This operation is `O(F)` where `F` is the number of fields. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.values + .iter_mut() + .for_each(|x| x.slice_unchecked(offset, length)); + } + + impl_sliced!(); + + impl_mut_validity!(); + + impl_into_array!(); +} + +// Accessors +impl StructArray { + #[inline] + fn len(&self) -> usize { + self.values[0].len() + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Returns the values of this [`StructArray`]. + pub fn values(&self) -> &[Box] { + &self.values + } + + /// Returns the fields of this [`StructArray`]. 
+ pub fn fields(&self) -> &[Field] { + Self::get_fields(&self.data_type) + } +} + +impl StructArray { + /// Returns the fields the `DataType::Struct`. + pub(crate) fn try_get_fields(data_type: &DataType) -> Result<&[Field], Error> { + match data_type.to_logical_type() { + DataType::Struct(fields) => Ok(fields), + _ => Err(Error::oos( + "Struct array must be created with a DataType whose physical type is Struct", + )), + } + } + + /// Returns the fields the `DataType::Struct`. + pub fn get_fields(data_type: &DataType) -> &[Field] { + Self::try_get_fields(data_type).unwrap() + } +} + +impl Array for StructArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} diff --git a/crates/nano-arrow/src/array/struct_/mutable.rs b/crates/nano-arrow/src/array/struct_/mutable.rs new file mode 100644 index 000000000000..8060a698fb63 --- /dev/null +++ b/crates/nano-arrow/src/array/struct_/mutable.rs @@ -0,0 +1,245 @@ +use std::sync::Arc; + +use super::StructArray; +use crate::array::{Array, MutableArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Error; + +/// Converting a [`MutableStructArray`] into a [`StructArray`] is `O(1)`. +#[derive(Debug)] +pub struct MutableStructArray { + data_type: DataType, + values: Vec>, + validity: Option, +} + +fn check( + data_type: &DataType, + values: &[Box], + validity: Option, +) -> Result<(), Error> { + let fields = StructArray::try_get_fields(data_type)?; + if fields.is_empty() { + return Err(Error::oos("A StructArray must contain at least one field")); + } + if fields.len() != values.len() { + return Err(Error::oos( + "A StructArray must have a number of fields in its DataType equal to the number of child values", + )); + } + + fields + .iter().map(|a| &a.data_type) + .zip(values.iter().map(|a| a.data_type())) + .enumerate() + .try_for_each(|(index, (data_type, child))| { + if data_type != child { + Err(Error::oos(format!( + "The children DataTypes of a StructArray must equal the children data types. + However, the field {index} has data type {data_type:?} but the value has data type {child:?}" + ))) + } else { + Ok(()) + } + })?; + + let len = values[0].len(); + values + .iter() + .map(|a| a.len()) + .enumerate() + .try_for_each(|(index, a_len)| { + if a_len != len { + Err(Error::oos(format!( + "The children must have an equal number of values. + However, the values at index {index} have a length of {a_len}, which is different from values at index 0, {len}." + ))) + } else { + Ok(()) + } + })?; + + if validity.map_or(false, |validity| validity != len) { + return Err(Error::oos( + "The validity length of a StructArray must match its number of elements", + )); + } + Ok(()) +} + +impl From for StructArray { + fn from(other: MutableStructArray) -> Self { + let validity = if other.validity.as_ref().map(|x| x.unset_bits()).unwrap_or(0) > 0 { + other.validity.map(|x| x.into()) + } else { + None + }; + + StructArray::new( + other.data_type, + other.values.into_iter().map(|mut v| v.as_box()).collect(), + validity, + ) + } +} + +impl MutableStructArray { + /// Creates a new [`MutableStructArray`]. + pub fn new(data_type: DataType, values: Vec>) -> Self { + Self::try_new(data_type, values, None).unwrap() + } + + /// Create a [`MutableStructArray`] out of low-end APIs. 
+ /// # Errors + /// This function errors iff: + /// * `data_type` is not [`DataType::Struct`] + /// * The inner types of `data_type` are not equal to those of `values` + /// * `validity` is not `None` and its length is different from the `values`'s length + pub fn try_new( + data_type: DataType, + values: Vec>, + validity: Option, + ) -> Result { + check(&data_type, &values, validity.as_ref().map(|x| x.len()))?; + Ok(Self { + data_type, + values, + validity, + }) + } + + /// Extract the low-end APIs from the [`MutableStructArray`]. + pub fn into_inner(self) -> (DataType, Vec>, Option) { + (self.data_type, self.values, self.validity) + } + + /// The mutable values + pub fn mut_values(&mut self) -> &mut Vec> { + &mut self.values + } + + /// The values + pub fn values(&self) -> &Vec> { + &self.values + } + + /// Return the `i`th child array. + pub fn value(&mut self, i: usize) -> Option<&mut A> { + self.values[i].as_mut_any().downcast_mut::() + } +} + +impl MutableStructArray { + /// Reserves `additional` entries. + pub fn reserve(&mut self, additional: usize) { + for v in &mut self.values { + v.reserve(additional); + } + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Call this once for each "row" of children you push. + pub fn push(&mut self, valid: bool) { + match &mut self.validity { + Some(validity) => validity.push(valid), + None => match valid { + true => (), + false => self.init_validity(), + }, + }; + } + + fn push_null(&mut self) { + for v in &mut self.values { + v.push_null(); + } + self.push(false); + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + let len = self.len(); + if len > 0 { + validity.extend_constant(len, true); + validity.set(len - 1, false); + } + self.validity = Some(validity) + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: StructArray = self.into(); + Arc::new(a) + } + + /// Shrinks the capacity of the [`MutableStructArray`] to fit its current length. 
+ pub fn shrink_to_fit(&mut self) { + for v in &mut self.values { + v.shrink_to_fit(); + } + if let Some(validity) = self.validity.as_mut() { + validity.shrink_to_fit() + } + } +} + +impl MutableArray for MutableStructArray { + fn len(&self) -> usize { + self.values.first().map(|v| v.len()).unwrap_or(0) + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + StructArray::new( + self.data_type.clone(), + std::mem::take(&mut self.values) + .into_iter() + .map(|mut v| v.as_box()) + .collect(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> Arc { + StructArray::new( + self.data_type.clone(), + std::mem::take(&mut self.values) + .into_iter() + .map(|mut v| v.as_box()) + .collect(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + self.push_null() + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } +} diff --git a/crates/nano-arrow/src/array/union/data.rs b/crates/nano-arrow/src/array/union/data.rs new file mode 100644 index 000000000000..6de6c0074231 --- /dev/null +++ b/crates/nano-arrow/src/array/union/data.rs @@ -0,0 +1,70 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{from_data, to_data, Arrow2Arrow, UnionArray}; +use crate::buffer::Buffer; +use crate::datatypes::DataType; + +impl Arrow2Arrow for UnionArray { + fn to_data(&self) -> ArrayData { + let data_type = arrow_schema::DataType::from(self.data_type.clone()); + let len = self.len(); + + let builder = match self.offsets.clone() { + Some(offsets) => ArrayDataBuilder::new(data_type) + .len(len) + .buffers(vec![self.types.clone().into(), offsets.into()]) + .child_data(self.fields.iter().map(|x| to_data(x.as_ref())).collect()), + None => ArrayDataBuilder::new(data_type) + .len(len) + .buffers(vec![self.types.clone().into()]) + .child_data( + self.fields + .iter() + .map(|x| to_data(x.as_ref()).slice(self.offset, len)) + .collect(), + ), + }; + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type: DataType = data.data_type().clone().into(); + + let fields = data.child_data().iter().map(from_data).collect(); + let buffers = data.buffers(); + let mut types: Buffer = buffers[0].clone().into(); + types.slice(data.offset(), data.len()); + let offsets = match buffers.len() == 2 { + true => { + let mut offsets: Buffer = buffers[1].clone().into(); + offsets.slice(data.offset(), data.len()); + Some(offsets) + }, + false => None, + }; + + // Map from type id to array index + let map = match &data_type { + DataType::Union(_, Some(ids), _) => { + let mut map = [0; 127]; + for (pos, &id) in ids.iter().enumerate() { + map[id as usize] = pos; + } + Some(map) + }, + DataType::Union(_, None, _) => None, + _ => unreachable!("must be Union type"), + }; + + Self { + types, + map, + fields, + offsets, + data_type, + offset: data.offset(), + } + } +} diff --git a/crates/nano-arrow/src/array/union/ffi.rs b/crates/nano-arrow/src/array/union/ffi.rs new file mode 100644 index 000000000000..590afec0c6c5 --- /dev/null +++ b/crates/nano-arrow/src/array/union/ffi.rs @@ -0,0 +1,60 @@ +use super::super::ffi::ToFfi; +use 
super::super::Array; +use super::UnionArray; +use crate::array::FromFfi; +use crate::error::Result; +use crate::ffi; + +unsafe impl ToFfi for UnionArray { + fn buffers(&self) -> Vec> { + if let Some(offsets) = &self.offsets { + vec![ + Some(self.types.as_ptr().cast::()), + Some(offsets.as_ptr().cast::()), + ] + } else { + vec![Some(self.types.as_ptr().cast::())] + } + } + + fn children(&self) -> Vec> { + self.fields.clone() + } + + fn offset(&self) -> Option { + Some(self.types.offset()) + } + + fn to_ffi_aligned(&self) -> Self { + self.clone() + } +} + +impl FromFfi for UnionArray { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let fields = Self::get_fields(&data_type); + + let mut types = unsafe { array.buffer::(0) }?; + let offsets = if Self::is_sparse(&data_type) { + None + } else { + Some(unsafe { array.buffer::(1) }?) + }; + + let length = array.array().len(); + let offset = array.array().offset(); + let fields = (0..fields.len()) + .map(|index| { + let child = array.child(index)?; + ffi::try_from(child) + }) + .collect::>>>()?; + + if offset > 0 { + types.slice(offset, length); + }; + + Self::try_new(data_type, types, fields, offsets) + } +} diff --git a/crates/nano-arrow/src/array/union/fmt.rs b/crates/nano-arrow/src/array/union/fmt.rs new file mode 100644 index 000000000000..521201fffd6d --- /dev/null +++ b/crates/nano-arrow/src/array/union/fmt.rs @@ -0,0 +1,24 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::{get_display, write_vec}; +use super::UnionArray; + +pub fn write_value( + array: &UnionArray, + index: usize, + null: &'static str, + f: &mut W, +) -> Result { + let (field, index) = array.index(index); + + get_display(array.fields()[field].as_ref(), null)(f, index) +} + +impl Debug for UnionArray { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, "None", f); + + write!(f, "UnionArray")?; + write_vec(f, writer, None, self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/union/iterator.rs b/crates/nano-arrow/src/array/union/iterator.rs new file mode 100644 index 000000000000..bdcf5825af6c --- /dev/null +++ b/crates/nano-arrow/src/array/union/iterator.rs @@ -0,0 +1,59 @@ +use super::UnionArray; +use crate::scalar::Scalar; +use crate::trusted_len::TrustedLen; + +#[derive(Debug, Clone)] +pub struct UnionIter<'a> { + array: &'a UnionArray, + current: usize, +} + +impl<'a> UnionIter<'a> { + #[inline] + pub fn new(array: &'a UnionArray) -> Self { + Self { array, current: 0 } + } +} + +impl<'a> Iterator for UnionIter<'a> { + type Item = Box; + + #[inline] + fn next(&mut self) -> Option { + if self.current == self.array.len() { + None + } else { + let old = self.current; + self.current += 1; + Some(unsafe { self.array.value_unchecked(old) }) + } + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + let len = self.array.len() - self.current; + (len, Some(len)) + } +} + +impl<'a> IntoIterator for &'a UnionArray { + type Item = Box; + type IntoIter = UnionIter<'a>; + + #[inline] + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +impl<'a> UnionArray { + /// constructs a new iterator + #[inline] + pub fn iter(&'a self) -> UnionIter<'a> { + UnionIter::new(self) + } +} + +impl<'a> std::iter::ExactSizeIterator for UnionIter<'a> {} + +unsafe impl<'a> TrustedLen for UnionIter<'a> {} diff --git a/crates/nano-arrow/src/array/union/mod.rs b/crates/nano-arrow/src/array/union/mod.rs new file mode 100644 index 
000000000000..75c83fb91759 --- /dev/null +++ b/crates/nano-arrow/src/array/union/mod.rs @@ -0,0 +1,377 @@ +use super::{new_empty_array, new_null_array, Array}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::{DataType, Field, UnionMode}; +use crate::error::Error; +use crate::scalar::{new_scalar, Scalar}; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod iterator; + +type UnionComponents<'a> = (&'a [Field], Option<&'a [i32]>, UnionMode); + +/// [`UnionArray`] represents an array whose each slot can contain different values. +/// +// How to read a value at slot i: +// ``` +// let index = self.types()[i] as usize; +// let field = self.fields()[index]; +// let offset = self.offsets().map(|x| x[index]).unwrap_or(i); +// let field = field.as_any().downcast to correct type; +// let value = field.value(offset); +// ``` +#[derive(Clone)] +pub struct UnionArray { + // Invariant: every item in `types` is `> 0 && < fields.len()` + types: Buffer, + // Invariant: `map.len() == fields.len()` + // Invariant: every item in `map` is `> 0 && < fields.len()` + map: Option<[usize; 127]>, + fields: Vec>, + // Invariant: when set, `offsets.len() == types.len()` + offsets: Option>, + data_type: DataType, + offset: usize, +} + +impl UnionArray { + /// Returns a new [`UnionArray`]. + /// # Errors + /// This function errors iff: + /// * `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Union`]. + /// * the fields's len is different from the `data_type`'s children's length + /// * The number of `fields` is larger than `i8::MAX` + /// * any of the values's data type is different from its corresponding children' data type + pub fn try_new( + data_type: DataType, + types: Buffer, + fields: Vec>, + offsets: Option>, + ) -> Result { + let (f, ids, mode) = Self::try_get_all(&data_type)?; + + if f.len() != fields.len() { + return Err(Error::oos( + "The number of `fields` must equal the number of children fields in DataType::Union", + )); + }; + let number_of_fields: i8 = fields + .len() + .try_into() + .map_err(|_| Error::oos("The number of `fields` cannot be larger than i8::MAX"))?; + + f + .iter().map(|a| a.data_type()) + .zip(fields.iter().map(|a| a.data_type())) + .enumerate() + .try_for_each(|(index, (data_type, child))| { + if data_type != child { + Err(Error::oos(format!( + "The children DataTypes of a UnionArray must equal the children data types. + However, the field {index} has data type {data_type:?} but the value has data type {child:?}" + ))) + } else { + Ok(()) + } + })?; + + if let Some(offsets) = &offsets { + if offsets.len() != types.len() { + return Err(Error::oos( + "In a UnionArray, the offsets' length must be equal to the number of types", + )); + } + } + if offsets.is_none() != mode.is_sparse() { + return Err(Error::oos( + "In a sparse UnionArray, the offsets must be set (and vice-versa)", + )); + } + + // build hash + let map = if let Some(&ids) = ids.as_ref() { + if ids.len() != fields.len() { + return Err(Error::oos( + "In a union, when the ids are set, their length must be equal to the number of fields", + )); + } + + // example: + // * types = [5, 7, 5, 7, 7, 7, 5, 7, 7, 5, 5] + // * ids = [5, 7] + // => hash = [0, 0, 0, 0, 0, 0, 1, 0, ...] 
+ let mut hash = [0; 127]; + + for (pos, &id) in ids.iter().enumerate() { + if !(0..=127).contains(&id) { + return Err(Error::oos( + "In a union, when the ids are set, every id must belong to [0, 128[", + )); + } + hash[id as usize] = pos; + } + + types.iter().try_for_each(|&type_| { + if type_ < 0 { + return Err(Error::oos("In a union, when the ids are set, every type must be >= 0")); + } + let id = hash[type_ as usize]; + if id >= fields.len() { + Err(Error::oos("In a union, when the ids are set, each id must be smaller than the number of fields.")) + } else { + Ok(()) + } + })?; + + Some(hash) + } else { + // Safety: every type in types is smaller than number of fields + let mut is_valid = true; + for &type_ in types.iter() { + if type_ < 0 || type_ >= number_of_fields { + is_valid = false + } + } + if !is_valid { + return Err(Error::oos( + "Every type in `types` must be larger than 0 and smaller than the number of fields.", + )); + } + + None + }; + + Ok(Self { + data_type, + map, + fields, + offsets, + types, + offset: 0, + }) + } + + /// Returns a new [`UnionArray`]. + /// # Panics + /// This function panics iff: + /// * `data_type`'s physical type is not [`crate::datatypes::PhysicalType::Union`]. + /// * the fields's len is different from the `data_type`'s children's length + /// * any of the values's data type is different from its corresponding children' data type + pub fn new( + data_type: DataType, + types: Buffer, + fields: Vec>, + offsets: Option>, + ) -> Self { + Self::try_new(data_type, types, fields, offsets).unwrap() + } + + /// Creates a new null [`UnionArray`]. + pub fn new_null(data_type: DataType, length: usize) -> Self { + if let DataType::Union(f, _, mode) = &data_type { + let fields = f + .iter() + .map(|x| new_null_array(x.data_type().clone(), length)) + .collect(); + + let offsets = if mode.is_sparse() { + None + } else { + Some((0..length as i32).collect::>().into()) + }; + + // all from the same field + let types = vec![0i8; length].into(); + + Self::new(data_type, types, fields, offsets) + } else { + panic!("Union struct must be created with the corresponding Union DataType") + } + } + + /// Creates a new empty [`UnionArray`]. + pub fn new_empty(data_type: DataType) -> Self { + if let DataType::Union(f, _, mode) = data_type.to_logical_type() { + let fields = f + .iter() + .map(|x| new_empty_array(x.data_type().clone())) + .collect(); + + let offsets = if mode.is_sparse() { + None + } else { + Some(Buffer::default()) + }; + + Self { + data_type, + map: None, + fields, + offsets, + types: Buffer::new(), + offset: 0, + } + } else { + panic!("Union struct must be created with the corresponding Union DataType") + } + } +} + +impl UnionArray { + /// Returns a slice of this [`UnionArray`]. + /// # Implementation + /// This operation is `O(F)` where `F` is the number of fields. + /// # Panic + /// This function panics iff `offset + length >= self.len()`. + #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new array cannot exceed the existing length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Returns a slice of this [`UnionArray`]. + /// # Implementation + /// This operation is `O(F)` where `F` is the number of fields. + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. 
+ #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + debug_assert!(offset + length <= self.len()); + + self.types.slice_unchecked(offset, length); + if let Some(offsets) = self.offsets.as_mut() { + offsets.slice_unchecked(offset, length) + } + self.offset += offset; + } + + impl_sliced!(); + impl_into_array!(); +} + +impl UnionArray { + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.types.len() + } + + /// The optional offsets. + pub fn offsets(&self) -> Option<&Buffer> { + self.offsets.as_ref() + } + + /// The fields. + pub fn fields(&self) -> &Vec> { + &self.fields + } + + /// The types. + pub fn types(&self) -> &Buffer { + &self.types + } + + #[inline] + unsafe fn field_slot_unchecked(&self, index: usize) -> usize { + self.offsets() + .as_ref() + .map(|x| *x.get_unchecked(index) as usize) + .unwrap_or(index + self.offset) + } + + /// Returns the index and slot of the field to select from `self.fields`. + #[inline] + pub fn index(&self, index: usize) -> (usize, usize) { + assert!(index < self.len()); + unsafe { self.index_unchecked(index) } + } + + /// Returns the index and slot of the field to select from `self.fields`. + /// The first value is guaranteed to be `< self.fields().len()` + /// # Safety + /// This function is safe iff `index < self.len`. + #[inline] + pub unsafe fn index_unchecked(&self, index: usize) -> (usize, usize) { + debug_assert!(index < self.len()); + // Safety: assumption of the function + let type_ = unsafe { *self.types.get_unchecked(index) }; + // Safety: assumption of the struct + let type_ = self + .map + .as_ref() + .map(|map| unsafe { *map.get_unchecked(type_ as usize) }) + .unwrap_or(type_ as usize); + // Safety: assumption of the function + let index = self.field_slot_unchecked(index); + (type_, index) + } + + /// Returns the slot `index` as a [`Scalar`]. + /// # Panics + /// iff `index >= self.len()` + pub fn value(&self, index: usize) -> Box { + assert!(index < self.len()); + unsafe { self.value_unchecked(index) } + } + + /// Returns the slot `index` as a [`Scalar`]. + /// # Safety + /// This function is safe iff `i < self.len`. + pub unsafe fn value_unchecked(&self, index: usize) -> Box { + debug_assert!(index < self.len()); + let (type_, index) = self.index_unchecked(index); + // Safety: assumption of the struct + debug_assert!(type_ < self.fields.len()); + let field = self.fields.get_unchecked(type_).as_ref(); + new_scalar(field, index) + } +} + +impl Array for UnionArray { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + None + } + + fn with_validity(&self, _: Option) -> Box { + panic!("cannot set validity of a union array") + } +} + +impl UnionArray { + fn try_get_all(data_type: &DataType) -> Result { + match data_type.to_logical_type() { + DataType::Union(fields, ids, mode) => { + Ok((fields, ids.as_ref().map(|x| x.as_ref()), *mode)) + }, + _ => Err(Error::oos( + "The UnionArray requires a logical type of DataType::Union", + )), + } + } + + fn get_all(data_type: &DataType) -> (&[Field], Option<&[i32]>, UnionMode) { + Self::try_get_all(data_type).unwrap() + } + + /// Returns all fields from [`DataType::Union`]. + /// # Panic + /// Panics iff `data_type`'s logical type is not [`DataType::Union`]. + pub fn get_fields(data_type: &DataType) -> &[Field] { + Self::get_all(data_type).0 + } + + /// Returns whether the [`DataType::Union`] is sparse or not. + /// # Panic + /// Panics iff `data_type`'s logical type is not [`DataType::Union`]. 
+ pub fn is_sparse(data_type: &DataType) -> bool { + Self::get_all(data_type).2.is_sparse() + } +} diff --git a/crates/nano-arrow/src/array/utf8/data.rs b/crates/nano-arrow/src/array/utf8/data.rs new file mode 100644 index 000000000000..16674c969372 --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/data.rs @@ -0,0 +1,42 @@ +use arrow_data::{ArrayData, ArrayDataBuilder}; + +use crate::array::{Arrow2Arrow, Utf8Array}; +use crate::bitmap::Bitmap; +use crate::offset::{Offset, OffsetsBuffer}; + +impl Arrow2Arrow for Utf8Array { + fn to_data(&self) -> ArrayData { + let data_type = self.data_type().clone().into(); + let builder = ArrayDataBuilder::new(data_type) + .len(self.offsets().len_proxy()) + .buffers(vec![ + self.offsets.clone().into_inner().into(), + self.values.clone().into(), + ]) + .nulls(self.validity.as_ref().map(|b| b.clone().into())); + + // Safety: Array is valid + unsafe { builder.build_unchecked() } + } + + fn from_data(data: &ArrayData) -> Self { + let data_type = data.data_type().clone().into(); + if data.is_empty() { + // Handle empty offsets + return Self::new_empty(data_type); + } + + let buffers = data.buffers(); + + // Safety: ArrayData is valid + let mut offsets = unsafe { OffsetsBuffer::new_unchecked(buffers[0].clone().into()) }; + offsets.slice(data.offset(), data.len() + 1); + + Self { + data_type, + offsets, + values: buffers[1].clone().into(), + validity: data.nulls().map(|n| Bitmap::from_null_buffer(n.clone())), + } + } +} diff --git a/crates/nano-arrow/src/array/utf8/ffi.rs b/crates/nano-arrow/src/array/utf8/ffi.rs new file mode 100644 index 000000000000..2129a85a6f8f --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/ffi.rs @@ -0,0 +1,62 @@ +use super::Utf8Array; +use crate::array::{FromFfi, ToFfi}; +use crate::bitmap::align; +use crate::error::Result; +use crate::ffi; +use crate::offset::{Offset, OffsetsBuffer}; + +unsafe impl ToFfi for Utf8Array { + fn buffers(&self) -> Vec> { + vec![ + self.validity.as_ref().map(|x| x.as_ptr()), + Some(self.offsets.buffer().as_ptr().cast::()), + Some(self.values.as_ptr().cast::()), + ] + } + + fn offset(&self) -> Option { + let offset = self.offsets.buffer().offset(); + if let Some(bitmap) = self.validity.as_ref() { + if bitmap.offset() == offset { + Some(offset) + } else { + None + } + } else { + Some(offset) + } + } + + fn to_ffi_aligned(&self) -> Self { + let offset = self.offsets.buffer().offset(); + + let validity = self.validity.as_ref().map(|bitmap| { + if bitmap.offset() == offset { + bitmap.clone() + } else { + align(bitmap, offset) + } + }); + + Self { + data_type: self.data_type.clone(), + validity, + offsets: self.offsets.clone(), + values: self.values.clone(), + } + } +} + +impl FromFfi for Utf8Array { + unsafe fn try_from_ffi(array: A) -> Result { + let data_type = array.data_type().clone(); + let validity = unsafe { array.validity() }?; + let offsets = unsafe { array.buffer::(1) }?; + let values = unsafe { array.buffer::(2)? 
}; + + // assumption that data from FFI is well constructed + let offsets = unsafe { OffsetsBuffer::new_unchecked(offsets) }; + + Ok(Self::new_unchecked(data_type, offsets, values, validity)) + } +} diff --git a/crates/nano-arrow/src/array/utf8/fmt.rs b/crates/nano-arrow/src/array/utf8/fmt.rs new file mode 100644 index 000000000000..4466444ffe3b --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/fmt.rs @@ -0,0 +1,23 @@ +use std::fmt::{Debug, Formatter, Result, Write}; + +use super::super::fmt::write_vec; +use super::Utf8Array; +use crate::offset::Offset; + +pub fn write_value(array: &Utf8Array, index: usize, f: &mut W) -> Result { + write!(f, "{}", array.value(index)) +} + +impl Debug for Utf8Array { + fn fmt(&self, f: &mut Formatter<'_>) -> Result { + let writer = |f: &mut Formatter, index| write_value(self, index, f); + + let head = if O::IS_LARGE { + "LargeUtf8Array" + } else { + "Utf8Array" + }; + write!(f, "{head}")?; + write_vec(f, writer, self.validity(), self.len(), "None", false) + } +} diff --git a/crates/nano-arrow/src/array/utf8/from.rs b/crates/nano-arrow/src/array/utf8/from.rs new file mode 100644 index 000000000000..c1dcaf09b10d --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/from.rs @@ -0,0 +1,11 @@ +use std::iter::FromIterator; + +use super::{MutableUtf8Array, Utf8Array}; +use crate::offset::Offset; + +impl> FromIterator> for Utf8Array { + #[inline] + fn from_iter>>(iter: I) -> Self { + MutableUtf8Array::::from_iter(iter).into() + } +} diff --git a/crates/nano-arrow/src/array/utf8/iterator.rs b/crates/nano-arrow/src/array/utf8/iterator.rs new file mode 100644 index 000000000000..262b98c10d79 --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/iterator.rs @@ -0,0 +1,79 @@ +use super::{MutableUtf8Array, MutableUtf8ValuesArray, Utf8Array}; +use crate::array::{ArrayAccessor, ArrayValuesIter}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::offset::Offset; + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for Utf8Array { + type Item = &'a str; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +/// Iterator of values of an [`Utf8Array`]. +pub type Utf8ValuesIter<'a, O> = ArrayValuesIter<'a, Utf8Array>; + +impl<'a, O: Offset> IntoIterator for &'a Utf8Array { + type Item = Option<&'a str>; + type IntoIter = ZipValidity<&'a str, Utf8ValuesIter<'a, O>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for MutableUtf8Array { + type Item = &'a str; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +/// Iterator of values of an [`MutableUtf8ValuesArray`]. 
+pub type MutableUtf8ValuesIter<'a, O> = ArrayValuesIter<'a, MutableUtf8ValuesArray>; + +impl<'a, O: Offset> IntoIterator for &'a MutableUtf8Array { + type Item = Option<&'a str>; + type IntoIter = ZipValidity<&'a str, MutableUtf8ValuesIter<'a, O>, BitmapIter<'a>>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} + +unsafe impl<'a, O: Offset> ArrayAccessor<'a> for MutableUtf8ValuesArray { + type Item = &'a str; + + #[inline] + unsafe fn value_unchecked(&'a self, index: usize) -> Self::Item { + self.value_unchecked(index) + } + + #[inline] + fn len(&self) -> usize { + self.len() + } +} + +impl<'a, O: Offset> IntoIterator for &'a MutableUtf8ValuesArray { + type Item = &'a str; + type IntoIter = ArrayValuesIter<'a, MutableUtf8ValuesArray>; + + fn into_iter(self) -> Self::IntoIter { + self.iter() + } +} diff --git a/crates/nano-arrow/src/array/utf8/mod.rs b/crates/nano-arrow/src/array/utf8/mod.rs new file mode 100644 index 000000000000..ab2c2a7bab8b --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/mod.rs @@ -0,0 +1,545 @@ +use either::Either; + +use super::specification::{try_check_offsets_bounds, try_check_utf8}; +use super::{Array, GenericBinaryArray}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets, OffsetsBuffer}; +use crate::trusted_len::TrustedLen; + +#[cfg(feature = "arrow")] +mod data; +mod ffi; +pub(super) mod fmt; +mod from; +mod iterator; +mod mutable; +mod mutable_values; +pub use iterator::*; +pub use mutable::*; +pub use mutable_values::MutableUtf8ValuesArray; + +// Auxiliary struct to allow presenting &str as [u8] to a generic function +pub(super) struct StrAsBytes

(P); +impl> AsRef<[u8]> for StrAsBytes { + #[inline(always)] + fn as_ref(&self) -> &[u8] { + self.0.as_ref().as_bytes() + } +} + +/// A [`Utf8Array`] is arrow's semantic equivalent of an immutable `Vec>`. +/// Cloning and slicing this struct is `O(1)`. +/// # Example +/// ``` +/// use arrow2::bitmap::Bitmap; +/// use arrow2::buffer::Buffer; +/// use arrow2::array::Utf8Array; +/// # fn main() { +/// let array = Utf8Array::::from([Some("hi"), None, Some("there")]); +/// assert_eq!(array.value(0), "hi"); +/// assert_eq!(array.iter().collect::>(), vec![Some("hi"), None, Some("there")]); +/// assert_eq!(array.values_iter().collect::>(), vec!["hi", "", "there"]); +/// // the underlying representation +/// assert_eq!(array.validity(), Some(&Bitmap::from([true, false, true]))); +/// assert_eq!(array.values(), &Buffer::from(b"hithere".to_vec())); +/// assert_eq!(array.offsets().buffer(), &Buffer::from(vec![0, 2, 2, 2 + 5])); +/// # } +/// ``` +/// +/// # Generic parameter +/// The generic parameter [`Offset`] can only be `i32` or `i64` and tradeoffs maximum array length with +/// memory usage: +/// * the sum of lengths of all elements cannot exceed `Offset::MAX` +/// * the total size of the underlying data is `array.len() * size_of::() + sum of lengths of all elements` +/// +/// # Safety +/// The following invariants hold: +/// * Two consecutives `offsets` casted (`as`) to `usize` are valid slices of `values`. +/// * A slice of `values` taken from two consecutives `offsets` is valid `utf8`. +/// * `len` is equal to `validity.len()`, when defined. +#[derive(Clone)] +pub struct Utf8Array { + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, +} + +// constructors +impl Utf8Array { + /// Returns a [`Utf8Array`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(N)` - checking utf8 is `O(N)` + pub fn try_new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Result { + try_check_utf8(&offsets, &values)?; + if validity + .as_ref() + .map_or(false, |validity| validity.len() != offsets.len_proxy()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + return Err(Error::oos( + "Utf8Array can only be initialized with DataType::Utf8 or DataType::LargeUtf8", + )); + } + + Ok(Self { + data_type, + offsets, + values, + validity, + }) + } + + /// Returns a [`Utf8Array`] from a slice of `&str`. + /// + /// A convenience method that uses [`Self::from_trusted_len_values_iter`]. + pub fn from_slice, P: AsRef<[T]>>(slice: P) -> Self { + Self::from_trusted_len_values_iter(slice.as_ref().iter()) + } + + /// Returns a new [`Utf8Array`] from a slice of `&str`. + /// + /// A convenience method that uses [`Self::from_trusted_len_iter`]. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. 
+ pub fn from, P: AsRef<[Option]>>(slice: P) -> Self { + MutableUtf8Array::::from(slice).into() + } + + /// Returns an iterator of `Option<&str>` + pub fn iter(&self) -> ZipValidity<&str, Utf8ValuesIter, BitmapIter> { + ZipValidity::new_with_validity(self.values_iter(), self.validity()) + } + + /// Returns an iterator of `&str` + pub fn values_iter(&self) -> Utf8ValuesIter { + Utf8ValuesIter::new(self) + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// Returns the value of the element at index `i`, ignoring the array's validity. + /// # Panic + /// This function panics iff `i >= self.len`. + #[inline] + pub fn value(&self, i: usize) -> &str { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the value of the element at index `i`, ignoring the array's validity. + /// # Safety + /// This function is safe iff `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &str { + // soundness: the invariant of the function + let (start, end) = self.offsets.start_end_unchecked(i); + + // soundness: the invariant of the struct + let slice = self.values.get_unchecked(start..end); + + // soundness: the invariant of the struct + std::str::from_utf8_unchecked(slice) + } + + /// Returns the element at index `i` or `None` if it is null + /// # Panics + /// iff `i >= self.len()` + #[inline] + pub fn get(&self, i: usize) -> Option<&str> { + if !self.is_null(i) { + // soundness: Array::is_null panics if i >= self.len + unsafe { Some(self.value_unchecked(i)) } + } else { + None + } + } + + /// Returns the [`DataType`] of this array. + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } + + /// Returns the values of this [`Utf8Array`]. + #[inline] + pub fn values(&self) -> &Buffer { + &self.values + } + + /// Returns the offsets of this [`Utf8Array`]. + #[inline] + pub fn offsets(&self) -> &OffsetsBuffer { + &self.offsets + } + + /// The optional validity. + #[inline] + pub fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + /// Slices this [`Utf8Array`]. + /// # Implementation + /// This function is `O(1)`. + /// # Panics + /// iff `offset + length > self.len()`. + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new array cannot exceed the arrays' length" + ); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices this [`Utf8Array`]. + /// # Implementation + /// This function is `O(1)` + /// # Safety + /// The caller must ensure that `offset + length <= self.len()`. 
+ pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.validity.as_mut().and_then(|bitmap| { + bitmap.slice_unchecked(offset, length); + (bitmap.unset_bits() > 0).then(|| bitmap) + }); + self.offsets.slice_unchecked(offset, length + 1); + } + + impl_sliced!(); + impl_mut_validity!(); + impl_into_array!(); + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (DataType, OffsetsBuffer, Buffer, Option) { + let Self { + data_type, + offsets, + values, + validity, + } = self; + (data_type, offsets, values, validity) + } + + /// Try to convert this `Utf8Array` to a `MutableUtf8Array` + #[must_use] + pub fn into_mut(self) -> Either> { + use Either::*; + if let Some(bitmap) = self.validity { + match bitmap.into_mut() { + // Safety: invariants are preserved + Left(bitmap) => Left(unsafe { + Utf8Array::new_unchecked( + self.data_type, + self.offsets, + self.values, + Some(bitmap), + ) + }), + Right(mutable_bitmap) => match (self.values.into_mut(), self.offsets.into_mut()) { + (Left(values), Left(offsets)) => { + // Safety: invariants are preserved + Left(unsafe { + Utf8Array::new_unchecked( + self.data_type, + offsets, + values, + Some(mutable_bitmap.into()), + ) + }) + }, + (Left(values), Right(offsets)) => { + // Safety: invariants are preserved + Left(unsafe { + Utf8Array::new_unchecked( + self.data_type, + offsets.into(), + values, + Some(mutable_bitmap.into()), + ) + }) + }, + (Right(values), Left(offsets)) => { + // Safety: invariants are preserved + Left(unsafe { + Utf8Array::new_unchecked( + self.data_type, + offsets, + values.into(), + Some(mutable_bitmap.into()), + ) + }) + }, + (Right(values), Right(offsets)) => Right(unsafe { + MutableUtf8Array::new_unchecked( + self.data_type, + offsets, + values, + Some(mutable_bitmap), + ) + }), + }, + } + } else { + match (self.values.into_mut(), self.offsets.into_mut()) { + (Left(values), Left(offsets)) => { + Left(unsafe { Utf8Array::new_unchecked(self.data_type, offsets, values, None) }) + }, + (Left(values), Right(offsets)) => Left(unsafe { + Utf8Array::new_unchecked(self.data_type, offsets.into(), values, None) + }), + (Right(values), Left(offsets)) => Left(unsafe { + Utf8Array::new_unchecked(self.data_type, offsets, values.into(), None) + }), + (Right(values), Right(offsets)) => Right(unsafe { + MutableUtf8Array::new_unchecked(self.data_type, offsets, values, None) + }), + } + } + } + + /// Returns a new empty [`Utf8Array`]. + /// + /// The array is guaranteed to have no elements nor validity. + #[inline] + pub fn new_empty(data_type: DataType) -> Self { + unsafe { Self::new_unchecked(data_type, OffsetsBuffer::new(), Buffer::new(), None) } + } + + /// Returns a new [`Utf8Array`] whose all slots are null / `None`. + #[inline] + pub fn new_null(data_type: DataType, length: usize) -> Self { + Self::new( + data_type, + Offsets::new_zeroed(length).into(), + Buffer::new(), + Some(Bitmap::new_zeroed(length)), + ) + } + + /// Returns a default [`DataType`] of this array, which depends on the generic parameter `O`: `DataType::Utf8` or `DataType::LargeUtf8` + pub fn default_data_type() -> DataType { + if O::IS_LARGE { + DataType::LargeUtf8 + } else { + DataType::Utf8 + } + } + + /// Creates a new [`Utf8Array`] without checking for offsets monotinicity nor utf8-validity + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. 
+ /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// # Safety + /// This function is unsound iff: + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(1)` + pub unsafe fn try_new_unchecked( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Result { + try_check_offsets_bounds(&offsets, values.len())?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != offsets.len_proxy()) + { + return Err(Error::oos( + "validity mask length must match the number of values", + )); + } + + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + return Err(Error::oos( + "BinaryArray can only be initialized with DataType::Utf8 or DataType::LargeUtf8", + )); + } + + Ok(Self { + data_type, + offsets, + values, + validity, + }) + } + + /// Creates a new [`Utf8Array`]. + /// # Panics + /// This function panics iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(N)` - checking utf8 is `O(N)` + pub fn new( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Self { + Self::try_new(data_type, offsets, values, validity).unwrap() + } + + /// Creates a new [`Utf8Array`] without checking for offsets monotinicity. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// # Safety + /// This function is unsound iff: + /// * the offsets are not monotonically increasing + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(1)` + pub unsafe fn new_unchecked( + data_type: DataType, + offsets: OffsetsBuffer, + values: Buffer, + validity: Option, + ) -> Self { + Self::try_new_unchecked(data_type, offsets, values, validity).unwrap() + } + + /// Returns a (non-null) [`Utf8Array`] created from a [`TrustedLen`] of `&str`. + /// # Implementation + /// This function is `O(N)` + #[inline] + pub fn from_trusted_len_values_iter, I: TrustedLen>( + iterator: I, + ) -> Self { + MutableUtf8Array::::from_trusted_len_values_iter(iterator).into() + } + + /// Creates a new [`Utf8Array`] from a [`Iterator`] of `&str`. + pub fn from_iter_values, I: Iterator>(iterator: I) -> Self { + MutableUtf8Array::::from_iter_values(iterator).into() + } + + /// Creates a [`Utf8Array`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef, + I: Iterator>, + { + MutableUtf8Array::::from_trusted_len_iter_unchecked(iterator).into() + } + + /// Creates a [`Utf8Array`] from an iterator of trusted length. 
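As a quick orientation to the read API added above, here is a minimal usage sketch. It assumes the crate is consumed as `nano_arrow` and that the public paths mirror the `arrow2` code this was forked from; the literal values are illustrative only.

```rust
use nano_arrow::array::Utf8Array; // path assumed to mirror arrow2

// Build an i32-offset utf8 array from optional strings.
let array = Utf8Array::<i32>::from([Some("hello"), None, Some("arrow")]);

assert_eq!(array.len(), 3);
assert_eq!(array.value(0), "hello"); // panics if out of bounds
assert_eq!(array.get(1), None);      // None because slot 1 is null
assert_eq!(
    array.iter().collect::<Vec<_>>(),
    vec![Some("hello"), None, Some("arrow")]
);
```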
+ #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef, + I: TrustedLen>, + { + MutableUtf8Array::::from_trusted_len_iter(iterator).into() + } + + /// Creates a [`Utf8Array`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked( + iterator: I, + ) -> std::result::Result + where + P: AsRef, + I: IntoIterator, E>>, + { + MutableUtf8Array::::try_from_trusted_len_iter_unchecked(iterator).map(|x| x.into()) + } + + /// Creates a [`Utf8Array`] from an fallible iterator of trusted length. + #[inline] + pub fn try_from_trusted_len_iter(iter: I) -> std::result::Result + where + P: AsRef, + I: TrustedLen, E>>, + { + MutableUtf8Array::::try_from_trusted_len_iter(iter).map(|x| x.into()) + } + + /// Applies a function `f` to the validity of this array. + /// + /// This is an API to leverage clone-on-write + /// # Panics + /// This function panics if the function `f` modifies the length of the [`Bitmap`]. + pub fn apply_validity Bitmap>(&mut self, f: F) { + if let Some(validity) = std::mem::take(&mut self.validity) { + self.set_validity(Some(f(validity))) + } + } +} + +impl Array for Utf8Array { + impl_common_array!(); + + fn validity(&self) -> Option<&Bitmap> { + self.validity.as_ref() + } + + #[inline] + fn with_validity(&self, validity: Option) -> Box { + Box::new(self.clone().with_validity(validity)) + } +} + +unsafe impl GenericBinaryArray for Utf8Array { + #[inline] + fn values(&self) -> &[u8] { + self.values() + } + + #[inline] + fn offsets(&self) -> &[O] { + self.offsets().buffer() + } +} + +impl Default for Utf8Array { + fn default() -> Self { + let data_type = if O::IS_LARGE { + DataType::LargeUtf8 + } else { + DataType::Utf8 + }; + Utf8Array::new(data_type, Default::default(), Default::default(), None) + } +} diff --git a/crates/nano-arrow/src/array/utf8/mutable.rs b/crates/nano-arrow/src/array/utf8/mutable.rs new file mode 100644 index 000000000000..3fc47b3eae1d --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/mutable.rs @@ -0,0 +1,549 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::{MutableUtf8ValuesArray, MutableUtf8ValuesIter, StrAsBytes, Utf8Array}; +use crate::array::physical_binary::*; +use crate::array::{Array, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::utils::{BitmapIter, ZipValidity}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; +use crate::trusted_len::TrustedLen; + +/// A [`MutableArray`] that builds a [`Utf8Array`]. It differs +/// from [`MutableUtf8ValuesArray`] in that it can build nullable [`Utf8Array`]s. +#[derive(Debug, Clone)] +pub struct MutableUtf8Array { + values: MutableUtf8ValuesArray, + validity: Option, +} + +impl From> for Utf8Array { + fn from(other: MutableUtf8Array) -> Self { + let validity = other.validity.and_then(|x| { + let validity: Option = x.into(); + validity + }); + let array: Utf8Array = other.values.into(); + array.with_validity(validity) + } +} + +impl Default for MutableUtf8Array { + fn default() -> Self { + Self::new() + } +} + +impl MutableUtf8Array { + /// Initializes a new empty [`MutableUtf8Array`]. 
+ pub fn new() -> Self { + Self { + values: Default::default(), + validity: None, + } + } + + /// Returns a [`MutableUtf8Array`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * the validity's length is not equal to `offsets.len()`. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(N)` - checking utf8 is `O(N)` + pub fn try_new( + data_type: DataType, + offsets: Offsets, + values: Vec, + validity: Option, + ) -> Result { + let values = MutableUtf8ValuesArray::try_new(data_type, offsets, values)?; + + if validity + .as_ref() + .map_or(false, |validity| validity.len() != values.len()) + { + return Err(Error::oos( + "validity's length must be equal to the number of values", + )); + } + + Ok(Self { values, validity }) + } + + /// Create a [`MutableUtf8Array`] out of low-end APIs. + /// # Safety + /// The caller must ensure that every value between offsets is a valid utf8. + /// # Panics + /// This function panics iff: + /// * The `offsets` and `values` are inconsistent + /// * The validity is not `None` and its length is different from `offsets`'s length minus one. + pub unsafe fn new_unchecked( + data_type: DataType, + offsets: Offsets, + values: Vec, + validity: Option, + ) -> Self { + let values = MutableUtf8ValuesArray::new_unchecked(data_type, offsets, values); + if let Some(ref validity) = validity { + assert_eq!(values.len(), validity.len()); + } + Self { values, validity } + } + + /// Creates a new [`MutableUtf8Array`] from a slice of optional `&[u8]`. + // Note: this can't be `impl From` because Rust does not allow double `AsRef` on it. + pub fn from, P: AsRef<[Option]>>(slice: P) -> Self { + Self::from_trusted_len_iter(slice.as_ref().iter().map(|x| x.as_ref())) + } + + fn default_data_type() -> DataType { + Utf8Array::::default_data_type() + } + + /// Initializes a new [`MutableUtf8Array`] with a pre-allocated capacity of slots. + pub fn with_capacity(capacity: usize) -> Self { + Self::with_capacities(capacity, 0) + } + + /// Initializes a new [`MutableUtf8Array`] with a pre-allocated capacity of slots and values. + pub fn with_capacities(capacity: usize, values: usize) -> Self { + Self { + values: MutableUtf8ValuesArray::with_capacities(capacity, values), + validity: None, + } + } + + /// Reserves `additional` elements and `additional_values` on the values buffer. + pub fn reserve(&mut self, additional: usize, additional_values: usize) { + self.values.reserve(additional, additional_values); + if let Some(x) = self.validity.as_mut() { + x.reserve(additional) + } + } + + /// Reserves `additional` elements and `additional_values` on the values buffer. + pub fn capacity(&self) -> usize { + self.values.capacity() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.values.len() + } + + /// Pushes a new element to the array. + /// # Panic + /// This operation panics iff the length of all values (in bytes) exceeds `O` maximum value. + #[inline] + pub fn push>(&mut self, value: Option) { + self.try_push(value).unwrap() + } + + /// Returns the value of the element at index `i`, ignoring the array's validity. + /// # Safety + /// This function is safe iff `i < self.len`. 
+ #[inline] + pub fn value(&self, i: usize) -> &str { + self.values.value(i) + } + + /// Returns the value of the element at index `i`, ignoring the array's validity. + /// # Safety + /// This function is safe iff `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &str { + self.values.value_unchecked(i) + } + + /// Pop the last entry from [`MutableUtf8Array`]. + /// This function returns `None` iff this array is empty. + pub fn pop(&mut self) -> Option { + let value = self.values.pop()?; + self.validity + .as_mut() + .map(|x| x.pop()?.then(|| ())) + .unwrap_or_else(|| Some(())) + .map(|_| value) + } + + fn init_validity(&mut self) { + let mut validity = MutableBitmap::with_capacity(self.values.capacity()); + validity.extend_constant(self.len(), true); + validity.set(self.len() - 1, false); + self.validity = Some(validity); + } + + /// Returns an iterator of `Option<&str>` + pub fn iter(&self) -> ZipValidity<&str, MutableUtf8ValuesIter, BitmapIter> { + ZipValidity::new(self.values_iter(), self.validity.as_ref().map(|x| x.iter())) + } + + /// Converts itself into an [`Array`]. + pub fn into_arc(self) -> Arc { + let a: Utf8Array = self.into(); + Arc::new(a) + } + + /// Shrinks the capacity of the [`MutableUtf8Array`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + if let Some(validity) = &mut self.validity { + validity.shrink_to_fit() + } + } + + /// Extract the low-end APIs from the [`MutableUtf8Array`]. + pub fn into_data(self) -> (DataType, Offsets, Vec, Option) { + let (data_type, offsets, values) = self.values.into_inner(); + (data_type, offsets, values, self.validity) + } + + /// Returns an iterator of `&str` + pub fn values_iter(&self) -> MutableUtf8ValuesIter { + self.values.iter() + } + + /// Sets the validity. + /// # Panic + /// Panics iff the validity's len is not equal to the existing values' length. + pub fn set_validity(&mut self, validity: Option) { + if let Some(validity) = &validity { + assert_eq!(self.values.len(), validity.len()) + } + self.validity = validity; + } + + /// Applies a function `f` to the validity of this array. + /// + /// This is an API to leverage clone-on-write + /// # Panics + /// This function panics if the function `f` modifies the length of the [`Bitmap`]. + pub fn apply_validity MutableBitmap>(&mut self, f: F) { + if let Some(validity) = std::mem::take(&mut self.validity) { + self.set_validity(Some(f(validity))) + } + } +} + +impl MutableUtf8Array { + /// returns its values. + pub fn values(&self) -> &Vec { + self.values.values() + } + + /// returns its offsets. 
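The mutable counterpart is typically used as a builder and then frozen into an immutable array. A small sketch, with the crate path and re-exports assumed to mirror arrow2:

```rust
use nano_arrow::array::{MutableUtf8Array, Utf8Array}; // paths assumed

let mut builder = MutableUtf8Array::<i32>::with_capacity(3);
builder.push(Some("a"));
builder.push::<&str>(None); // null slot; the validity bitmap is allocated lazily
builder.push(Some("c"));

assert_eq!(builder.len(), 3);
assert_eq!(builder.pop(), Some("c".to_string()));

// Freezing moves the offsets/values buffers; the string bytes are not copied.
let array: Utf8Array<i32> = builder.into();
assert_eq!(array.iter().collect::<Vec<_>>(), vec![Some("a"), None]);
```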
+ pub fn offsets(&self) -> &Offsets { + self.values.offsets() + } +} + +impl MutableArray for MutableUtf8Array { + fn len(&self) -> usize { + self.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + let array: Utf8Array = std::mem::take(self).into(); + array.boxed() + } + + fn as_arc(&mut self) -> Arc { + let array: Utf8Array = std::mem::take(self).into(); + array.arced() + } + + fn data_type(&self) -> &DataType { + if O::IS_LARGE { + &DataType::LargeUtf8 + } else { + &DataType::Utf8 + } + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push::<&str>(None) + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional, 0) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl> FromIterator> for MutableUtf8Array { + fn from_iter>>(iter: I) -> Self { + Self::try_from_iter(iter).unwrap() + } +} + +impl MutableUtf8Array { + /// Extends the [`MutableUtf8Array`] from an iterator of values of trusted len. + /// This differs from `extended_trusted_len` which accepts iterator of optional values. + #[inline] + pub fn extend_trusted_len_values(&mut self, iterator: I) + where + P: AsRef, + I: TrustedLen, + { + unsafe { self.extend_trusted_len_values_unchecked(iterator) } + } + + /// Extends the [`MutableUtf8Array`] from an iterator of values. + /// This differs from `extended_trusted_len` which accepts iterator of optional values. + #[inline] + pub fn extend_values(&mut self, iterator: I) + where + P: AsRef, + I: Iterator, + { + let length = self.values.len(); + self.values.extend(iterator); + let additional = self.values.len() - length; + + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(additional, true); + } + } + + /// Extends the [`MutableUtf8Array`] from an iterator of values of trusted len. + /// This differs from `extended_trusted_len_unchecked` which accepts iterator of optional + /// values. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_values_unchecked(&mut self, iterator: I) + where + P: AsRef, + I: Iterator, + { + let length = self.values.len(); + self.values.extend_trusted_len_unchecked(iterator); + let additional = self.values.len() - length; + + if let Some(validity) = self.validity.as_mut() { + validity.extend_constant(additional, true); + } + } + + /// Extends the [`MutableUtf8Array`] from an iterator of trusted len. + #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: AsRef, + I: TrustedLen>, + { + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends [`MutableUtf8Array`] from an iterator of trusted len. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: AsRef, + I: Iterator>, + { + if self.validity.is_none() { + let mut validity = MutableBitmap::new(); + validity.extend_constant(self.len(), true); + self.validity = Some(validity); + } + + self.values + .extend_from_trusted_len_iter(self.validity.as_mut().unwrap(), iterator); + } + + /// Creates a [`MutableUtf8Array`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. 
+ #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef, + I: Iterator>, + { + let iterator = iterator.map(|x| x.map(StrAsBytes)); + let (validity, offsets, values) = trusted_len_unzip(iterator); + + // soundness: P is `str` + Self::new_unchecked(Self::default_data_type(), offsets, values, validity) + } + + /// Creates a [`MutableUtf8Array`] from an iterator of trusted length. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef, + I: TrustedLen>, + { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a [`MutableUtf8Array`] from an iterator of trusted length of `&str`. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_values_iter_unchecked, I: Iterator>( + iterator: I, + ) -> Self { + MutableUtf8ValuesArray::from_trusted_len_iter_unchecked(iterator).into() + } + + /// Creates a new [`MutableUtf8Array`] from a [`TrustedLen`] of `&str`. + #[inline] + pub fn from_trusted_len_values_iter, I: TrustedLen>( + iterator: I, + ) -> Self { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_values_iter_unchecked(iterator) } + } + + /// Creates a new [`MutableUtf8Array`] from an iterator. + /// # Error + /// This operation errors iff the total length in bytes on the iterator exceeds `O`'s maximum value. + /// (`i32::MAX` or `i64::MAX` respectively). + fn try_from_iter, I: IntoIterator>>(iter: I) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut array = Self::with_capacity(lower); + for item in iterator { + array.try_push(item)?; + } + Ok(array) + } + + /// Creates a [`MutableUtf8Array`] from an falible iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked( + iterator: I, + ) -> std::result::Result + where + P: AsRef, + I: IntoIterator, E>>, + { + let iterator = iterator.into_iter(); + + let iterator = iterator.map(|x| x.map(|x| x.map(StrAsBytes))); + let (validity, offsets, values) = try_trusted_len_unzip(iterator)?; + + // soundness: P is `str` + Ok(Self::new_unchecked( + Self::default_data_type(), + offsets, + values, + validity, + )) + } + + /// Creates a [`MutableUtf8Array`] from an falible iterator of trusted length. + #[inline] + pub fn try_from_trusted_len_iter(iterator: I) -> std::result::Result + where + P: AsRef, + I: TrustedLen, E>>, + { + // soundness: I: TrustedLen + unsafe { Self::try_from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a new [`MutableUtf8Array`] from a [`Iterator`] of `&str`. 
+ pub fn from_iter_values, I: Iterator>(iterator: I) -> Self { + MutableUtf8ValuesArray::from_iter(iterator).into() + } + + /// Extend with a fallible iterator + pub fn extend_fallible(&mut self, iter: I) -> std::result::Result<(), E> + where + E: std::error::Error, + I: IntoIterator, E>>, + T: AsRef, + { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| { + self.push(x?); + Ok(()) + }) + } +} + +impl> Extend> for MutableUtf8Array { + fn extend>>(&mut self, iter: I) { + self.try_extend(iter).unwrap(); + } +} + +impl> TryExtend> for MutableUtf8Array { + fn try_extend>>(&mut self, iter: I) -> Result<()> { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| self.try_push(x)) + } +} + +impl> TryPush> for MutableUtf8Array { + #[inline] + fn try_push(&mut self, value: Option) -> Result<()> { + match value { + Some(value) => { + self.values.try_push(value.as_ref())?; + + match &mut self.validity { + Some(validity) => validity.push(true), + None => {}, + } + }, + None => { + self.values.push(""); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + }, + } + Ok(()) + } +} + +impl PartialEq for MutableUtf8Array { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl TryExtendFromSelf for MutableUtf8Array { + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + extend_validity(self.len(), &mut self.validity, &other.validity); + + self.values.try_extend_from_self(&other.values) + } +} diff --git a/crates/nano-arrow/src/array/utf8/mutable_values.rs b/crates/nano-arrow/src/array/utf8/mutable_values.rs new file mode 100644 index 000000000000..8810d30febb5 --- /dev/null +++ b/crates/nano-arrow/src/array/utf8/mutable_values.rs @@ -0,0 +1,407 @@ +use std::iter::FromIterator; +use std::sync::Arc; + +use super::{MutableUtf8Array, StrAsBytes, Utf8Array}; +use crate::array::physical_binary::*; +use crate::array::specification::{try_check_offsets_bounds, try_check_utf8}; +use crate::array::{Array, ArrayValuesIter, MutableArray, TryExtend, TryExtendFromSelf, TryPush}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; +use crate::trusted_len::TrustedLen; + +/// A [`MutableArray`] that builds a [`Utf8Array`]. It differs +/// from [`MutableUtf8Array`] in that it builds non-null [`Utf8Array`]. +#[derive(Debug, Clone)] +pub struct MutableUtf8ValuesArray { + data_type: DataType, + offsets: Offsets, + values: Vec, +} + +impl From> for Utf8Array { + fn from(other: MutableUtf8ValuesArray) -> Self { + // Safety: + // `MutableUtf8ValuesArray` has the same invariants as `Utf8Array` and thus + // `Utf8Array` can be safely created from `MutableUtf8ValuesArray` without checks. + unsafe { + Utf8Array::::new_unchecked( + other.data_type, + other.offsets.into(), + other.values.into(), + None, + ) + } + } +} + +impl From> for MutableUtf8Array { + fn from(other: MutableUtf8ValuesArray) -> Self { + // Safety: + // `MutableUtf8ValuesArray` has the same invariants as `MutableUtf8Array` + unsafe { + MutableUtf8Array::::new_unchecked(other.data_type, other.offsets, other.values, None) + } + } +} + +impl Default for MutableUtf8ValuesArray { + fn default() -> Self { + Self::new() + } +} + +impl MutableUtf8ValuesArray { + /// Returns an empty [`MutableUtf8ValuesArray`]. 
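The `Extend`/`TryExtend`/`TryPush` impls above are what most call sites use instead of pushing element by element; the `Try*` variants surface offset overflow (more than `i32::MAX`/`i64::MAX` bytes of string data) as an error instead of a panic. A sketch under the same path assumptions:

```rust
use nano_arrow::array::{MutableUtf8Array, TryPush}; // paths assumed

let mut array = MutableUtf8Array::<i32>::new();

// `Extend` accepts any iterator of `Option<impl AsRef<str>>`.
array.extend(vec![Some("foo"), None]);

// `TryPush` returns an error on offset overflow instead of panicking.
array.try_push(Some("bar")).unwrap();

assert_eq!(array.len(), 3);
```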
+ pub fn new() -> Self { + Self { + data_type: Self::default_data_type(), + offsets: Offsets::new(), + values: Vec::::new(), + } + } + + /// Returns a [`MutableUtf8ValuesArray`] created from its internal representation. + /// + /// # Errors + /// This function returns an error iff: + /// * The last offset is not equal to the values' length. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is not equal to either `Utf8` or `LargeUtf8`. + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(N)` - checking utf8 is `O(N)` + pub fn try_new(data_type: DataType, offsets: Offsets, values: Vec) -> Result { + try_check_utf8(&offsets, &values)?; + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + return Err(Error::oos( + "MutableUtf8ValuesArray can only be initialized with DataType::Utf8 or DataType::LargeUtf8", + )); + } + + Ok(Self { + data_type, + offsets, + values, + }) + } + + /// Returns a [`MutableUtf8ValuesArray`] created from its internal representation. + /// + /// # Panic + /// This function does not panic iff: + /// * The last offset is equal to the values' length. + /// * The `data_type`'s [`crate::datatypes::PhysicalType`] is equal to either `Utf8` or `LargeUtf8`. + /// # Safety + /// This function is safe iff: + /// * the offsets are monotonically increasing + /// * The `values` between two consecutive `offsets` are not valid utf8 + /// # Implementation + /// This function is `O(1)` + pub unsafe fn new_unchecked(data_type: DataType, offsets: Offsets, values: Vec) -> Self { + try_check_offsets_bounds(&offsets, values.len()) + .expect("The length of the values must be equal to the last offset value"); + + if data_type.to_physical_type() != Self::default_data_type().to_physical_type() { + panic!("MutableUtf8ValuesArray can only be initialized with DataType::Utf8 or DataType::LargeUtf8") + } + + Self { + data_type, + offsets, + values, + } + } + + /// Returns the default [`DataType`] of this container: [`DataType::Utf8`] or [`DataType::LargeUtf8`] + /// depending on the generic [`Offset`]. + pub fn default_data_type() -> DataType { + Utf8Array::::default_data_type() + } + + /// Initializes a new [`MutableUtf8ValuesArray`] with a pre-allocated capacity of items. + pub fn with_capacity(capacity: usize) -> Self { + Self::with_capacities(capacity, 0) + } + + /// Initializes a new [`MutableUtf8ValuesArray`] with a pre-allocated capacity of items and values. + pub fn with_capacities(capacity: usize, values: usize) -> Self { + Self { + data_type: Self::default_data_type(), + offsets: Offsets::::with_capacity(capacity), + values: Vec::::with_capacity(values), + } + } + + /// returns its values. + #[inline] + pub fn values(&self) -> &Vec { + &self.values + } + + /// returns its offsets. + #[inline] + pub fn offsets(&self) -> &Offsets { + &self.offsets + } + + /// Reserves `additional` elements and `additional_values` on the values. + #[inline] + pub fn reserve(&mut self, additional: usize, additional_values: usize) { + self.offsets.reserve(additional + 1); + self.values.reserve(additional_values); + } + + /// Returns the capacity in number of items + pub fn capacity(&self) -> usize { + self.offsets.capacity() + } + + /// Returns the length of this array + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + /// Pushes a new item to the array. + /// # Panic + /// This operation panics iff the length of all values (in bytes) exceeds `O` maximum value. 
+ #[inline] + pub fn push>(&mut self, value: T) { + self.try_push(value).unwrap() + } + + /// Pop the last entry from [`MutableUtf8ValuesArray`]. + /// This function returns `None` iff this array is empty. + pub fn pop(&mut self) -> Option { + if self.len() == 0 { + return None; + } + self.offsets.pop()?; + let start = self.offsets.last().to_usize(); + let value = self.values.split_off(start); + // Safety: utf8 is validated on initialization + Some(unsafe { String::from_utf8_unchecked(value) }) + } + + /// Returns the value of the element at index `i`. + /// # Panic + /// This function panics iff `i >= self.len`. + #[inline] + pub fn value(&self, i: usize) -> &str { + assert!(i < self.len()); + unsafe { self.value_unchecked(i) } + } + + /// Returns the value of the element at index `i`. + /// # Safety + /// This function is safe iff `i < self.len`. + #[inline] + pub unsafe fn value_unchecked(&self, i: usize) -> &str { + // soundness: the invariant of the function + let (start, end) = self.offsets.start_end(i); + + // soundness: the invariant of the struct + let slice = self.values.get_unchecked(start..end); + + // soundness: the invariant of the struct + std::str::from_utf8_unchecked(slice) + } + + /// Returns an iterator of `&str` + pub fn iter(&self) -> ArrayValuesIter { + ArrayValuesIter::new(self) + } + + /// Shrinks the capacity of the [`MutableUtf8ValuesArray`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.values.shrink_to_fit(); + self.offsets.shrink_to_fit(); + } + + /// Extract the low-end APIs from the [`MutableUtf8ValuesArray`]. + pub fn into_inner(self) -> (DataType, Offsets, Vec) { + (self.data_type, self.offsets, self.values) + } +} + +impl MutableArray for MutableUtf8ValuesArray { + fn len(&self) -> usize { + self.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + None + } + + fn as_box(&mut self) -> Box { + let array: Utf8Array = std::mem::take(self).into(); + array.boxed() + } + + fn as_arc(&mut self) -> Arc { + let array: Utf8Array = std::mem::take(self).into(); + array.arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push::<&str>("") + } + + fn reserve(&mut self, additional: usize) { + self.reserve(additional, 0) + } + + fn shrink_to_fit(&mut self) { + self.shrink_to_fit() + } +} + +impl> FromIterator


for MutableUtf8ValuesArray { + fn from_iter>(iter: I) -> Self { + let (offsets, values) = values_iter(iter.into_iter().map(StrAsBytes)); + // soundness: T: AsRef and offsets are monotonically increasing + unsafe { Self::new_unchecked(Self::default_data_type(), offsets, values) } + } +} + +impl MutableUtf8ValuesArray { + pub(crate) unsafe fn extend_from_trusted_len_iter( + &mut self, + validity: &mut MutableBitmap, + iterator: I, + ) where + P: AsRef, + I: Iterator>, + { + let iterator = iterator.map(|x| x.map(StrAsBytes)); + extend_from_trusted_len_iter(&mut self.offsets, &mut self.values, validity, iterator); + } + + /// Extends the [`MutableUtf8ValuesArray`] from a [`TrustedLen`] + #[inline] + pub fn extend_trusted_len(&mut self, iterator: I) + where + P: AsRef, + I: TrustedLen, + { + unsafe { self.extend_trusted_len_unchecked(iterator) } + } + + /// Extends [`MutableUtf8ValuesArray`] from an iterator of trusted len. + /// # Safety + /// The iterator must be trusted len. + #[inline] + pub unsafe fn extend_trusted_len_unchecked(&mut self, iterator: I) + where + P: AsRef, + I: Iterator, + { + let iterator = iterator.map(StrAsBytes); + extend_from_trusted_len_values_iter(&mut self.offsets, &mut self.values, iterator); + } + + /// Creates a [`MutableUtf8ValuesArray`] from a [`TrustedLen`] + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + P: AsRef, + I: TrustedLen, + { + // soundness: I is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Returns a new [`MutableUtf8ValuesArray`] from an iterator of trusted length. + /// # Safety + /// The iterator must be [`TrustedLen`](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). + /// I.e. that `size_hint().1` correctly reports its length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + P: AsRef, + I: Iterator, + { + let iterator = iterator.map(StrAsBytes); + let (offsets, values) = trusted_len_values_iter(iterator); + + // soundness: P is `str` and offsets are monotonically increasing + Self::new_unchecked(Self::default_data_type(), offsets, values) + } + + /// Returns a new [`MutableUtf8ValuesArray`] from an iterator. + /// # Error + /// This operation errors iff the total length in bytes on the iterator exceeds `O`'s maximum value. + /// (`i32::MAX` or `i64::MAX` respectively). 
+ pub fn try_from_iter, I: IntoIterator>(iter: I) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut array = Self::with_capacity(lower); + for item in iterator { + array.try_push(item)?; + } + Ok(array) + } + + /// Extend with a fallible iterator + pub fn extend_fallible(&mut self, iter: I) -> std::result::Result<(), E> + where + E: std::error::Error, + I: IntoIterator>, + T: AsRef, + { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| { + self.push(x?); + Ok(()) + }) + } +} + +impl> Extend for MutableUtf8ValuesArray { + fn extend>(&mut self, iter: I) { + extend_from_values_iter( + &mut self.offsets, + &mut self.values, + iter.into_iter().map(StrAsBytes), + ); + } +} + +impl> TryExtend for MutableUtf8ValuesArray { + fn try_extend>(&mut self, iter: I) -> Result<()> { + let mut iter = iter.into_iter(); + self.reserve(iter.size_hint().0, 0); + iter.try_for_each(|x| self.try_push(x)) + } +} + +impl> TryPush for MutableUtf8ValuesArray { + #[inline] + fn try_push(&mut self, value: T) -> Result<()> { + let bytes = value.as_ref().as_bytes(); + self.values.extend_from_slice(bytes); + self.offsets.try_push_usize(bytes.len()) + } +} + +impl TryExtendFromSelf for MutableUtf8ValuesArray { + fn try_extend_from_self(&mut self, other: &Self) -> Result<()> { + self.values.extend_from_slice(&other.values); + self.offsets.try_extend_from_self(&other.offsets) + } +} diff --git a/crates/nano-arrow/src/bitmap/assign_ops.rs b/crates/nano-arrow/src/bitmap/assign_ops.rs new file mode 100644 index 000000000000..b4d3702c69eb --- /dev/null +++ b/crates/nano-arrow/src/bitmap/assign_ops.rs @@ -0,0 +1,190 @@ +use super::utils::{BitChunk, BitChunkIterExact, BitChunksExact}; +use crate::bitmap::{Bitmap, MutableBitmap}; + +/// Applies a function to every bit of this [`MutableBitmap`] in chunks +/// +/// This function can be for operations like `!` to a [`MutableBitmap`]. 
+pub fn unary_assign T>(bitmap: &mut MutableBitmap, op: F) { + let mut chunks = bitmap.bitchunks_exact_mut::(); + + chunks.by_ref().for_each(|chunk| { + let new_chunk: T = match (chunk as &[u8]).try_into() { + Ok(a) => T::from_ne_bytes(a), + Err(_) => unreachable!(), + }; + let new_chunk = op(new_chunk); + chunk.copy_from_slice(new_chunk.to_ne_bytes().as_ref()); + }); + + if chunks.remainder().is_empty() { + return; + } + let mut new_remainder = T::zero().to_ne_bytes(); + chunks + .remainder() + .iter() + .enumerate() + .for_each(|(index, b)| new_remainder[index] = *b); + new_remainder = op(T::from_ne_bytes(new_remainder)).to_ne_bytes(); + + let len = chunks.remainder().len(); + chunks + .remainder() + .copy_from_slice(&new_remainder.as_ref()[..len]); +} + +impl std::ops::Not for MutableBitmap { + type Output = Self; + + #[inline] + fn not(mut self) -> Self { + unary_assign(&mut self, |a: u64| !a); + self + } +} + +fn binary_assign_impl(lhs: &mut MutableBitmap, mut rhs: I, op: F) +where + I: BitChunkIterExact, + T: BitChunk, + F: Fn(T, T) -> T, +{ + let mut lhs_chunks = lhs.bitchunks_exact_mut::(); + + lhs_chunks + .by_ref() + .zip(rhs.by_ref()) + .for_each(|(lhs, rhs)| { + let new_chunk: T = match (lhs as &[u8]).try_into() { + Ok(a) => T::from_ne_bytes(a), + Err(_) => unreachable!(), + }; + let new_chunk = op(new_chunk, rhs); + lhs.copy_from_slice(new_chunk.to_ne_bytes().as_ref()); + }); + + let rem_lhs = lhs_chunks.remainder(); + let rem_rhs = rhs.remainder(); + if rem_lhs.is_empty() { + return; + } + let mut new_remainder = T::zero().to_ne_bytes(); + lhs_chunks + .remainder() + .iter() + .enumerate() + .for_each(|(index, b)| new_remainder[index] = *b); + new_remainder = op(T::from_ne_bytes(new_remainder), rem_rhs).to_ne_bytes(); + + let len = lhs_chunks.remainder().len(); + lhs_chunks + .remainder() + .copy_from_slice(&new_remainder.as_ref()[..len]); +} + +/// Apply a bitwise binary operation to a [`MutableBitmap`]. +/// +/// This function can be used for operations like `&=` to a [`MutableBitmap`]. 
+/// # Panics +/// This function panics iff `lhs.len() != `rhs.len()` +pub fn binary_assign(lhs: &mut MutableBitmap, rhs: &Bitmap, op: F) +where + F: Fn(T, T) -> T, +{ + assert_eq!(lhs.len(), rhs.len()); + + let (slice, offset, length) = rhs.as_slice(); + if offset == 0 { + let iter = BitChunksExact::::new(slice, length); + binary_assign_impl(lhs, iter, op) + } else { + let rhs_chunks = rhs.chunks::(); + binary_assign_impl(lhs, rhs_chunks, op) + } +} + +#[inline] +/// Compute bitwise OR operation in-place +fn or_assign(lhs: &mut MutableBitmap, rhs: &Bitmap) { + if rhs.unset_bits() == 0 { + assert_eq!(lhs.len(), rhs.len()); + lhs.clear(); + lhs.extend_constant(rhs.len(), true); + } else if rhs.unset_bits() == rhs.len() { + // bitmap remains + } else { + binary_assign(lhs, rhs, |x: T, y| x | y) + } +} + +impl<'a> std::ops::BitOrAssign<&'a Bitmap> for &mut MutableBitmap { + #[inline] + fn bitor_assign(&mut self, rhs: &'a Bitmap) { + or_assign::(self, rhs) + } +} + +impl<'a> std::ops::BitOr<&'a Bitmap> for MutableBitmap { + type Output = Self; + + #[inline] + fn bitor(mut self, rhs: &'a Bitmap) -> Self { + or_assign::(&mut self, rhs); + self + } +} + +#[inline] +/// Compute bitwise `&` between `lhs` and `rhs`, assigning it to `lhs` +fn and_assign(lhs: &mut MutableBitmap, rhs: &Bitmap) { + if rhs.unset_bits() == 0 { + // bitmap remains + } + if rhs.unset_bits() == rhs.len() { + assert_eq!(lhs.len(), rhs.len()); + lhs.clear(); + lhs.extend_constant(rhs.len(), false); + } else { + binary_assign(lhs, rhs, |x: T, y| x & y) + } +} + +impl<'a> std::ops::BitAndAssign<&'a Bitmap> for &mut MutableBitmap { + #[inline] + fn bitand_assign(&mut self, rhs: &'a Bitmap) { + and_assign::(self, rhs) + } +} + +impl<'a> std::ops::BitAnd<&'a Bitmap> for MutableBitmap { + type Output = Self; + + #[inline] + fn bitand(mut self, rhs: &'a Bitmap) -> Self { + and_assign::(&mut self, rhs); + self + } +} + +#[inline] +/// Compute bitwise XOR operation +fn xor_assign(lhs: &mut MutableBitmap, rhs: &Bitmap) { + binary_assign(lhs, rhs, |x: T, y| x ^ y) +} + +impl<'a> std::ops::BitXorAssign<&'a Bitmap> for &mut MutableBitmap { + #[inline] + fn bitxor_assign(&mut self, rhs: &'a Bitmap) { + xor_assign::(self, rhs) + } +} + +impl<'a> std::ops::BitXor<&'a Bitmap> for MutableBitmap { + type Output = Self; + + #[inline] + fn bitxor(mut self, rhs: &'a Bitmap) -> Self { + xor_assign::(&mut self, rhs); + self + } +} diff --git a/crates/nano-arrow/src/bitmap/bitmap_ops.rs b/crates/nano-arrow/src/bitmap/bitmap_ops.rs new file mode 100644 index 000000000000..c83e63255093 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/bitmap_ops.rs @@ -0,0 +1,268 @@ +use std::ops::{BitAnd, BitOr, BitXor, Not}; + +use super::utils::{BitChunk, BitChunkIterExact, BitChunksExact}; +use super::Bitmap; +use crate::bitmap::MutableBitmap; +use crate::trusted_len::TrustedLen; + +/// Creates a [Vec] from an [`Iterator`] of [`BitChunk`]. +/// # Safety +/// The iterator must be [`TrustedLen`]. 
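These operator impls let a `MutableBitmap` be combined with an immutable `Bitmap` while reusing the mutable allocation. A sketch, with the crate path assumed:

```rust
use nano_arrow::bitmap::{Bitmap, MutableBitmap}; // path assumed

let lhs = MutableBitmap::from([true, true, false, false]);
let rhs = Bitmap::from([true, false, true, false]);

// The consuming `&` reuses `lhs`'s buffer and applies the op per 64-bit chunk.
let anded = lhs & &rhs;
assert_eq!(anded.iter().collect::<Vec<_>>(), vec![true, false, false, false]);

// `!` is the in-place unary counterpart.
let negated = !anded;
assert_eq!(negated.iter().collect::<Vec<_>>(), vec![false, true, true, true]);
```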
+pub unsafe fn from_chunk_iter_unchecked>( + iterator: I, +) -> Vec { + let (_, upper) = iterator.size_hint(); + let upper = upper.expect("try_from_trusted_len_iter requires an upper limit"); + let len = upper * std::mem::size_of::(); + + let mut buffer = Vec::with_capacity(len); + + let mut dst = buffer.as_mut_ptr(); + for item in iterator { + let bytes = item.to_ne_bytes(); + for i in 0..std::mem::size_of::() { + std::ptr::write(dst, bytes[i]); + dst = dst.add(1); + } + } + assert_eq!( + dst.offset_from(buffer.as_ptr()) as usize, + len, + "Trusted iterator length was not accurately reported" + ); + buffer.set_len(len); + buffer +} + +/// Creates a [`Vec`] from a [`TrustedLen`] of [`BitChunk`]. +pub fn chunk_iter_to_vec>(iter: I) -> Vec { + unsafe { from_chunk_iter_unchecked(iter) } +} + +/// Apply a bitwise operation `op` to four inputs and return the result as a [`Bitmap`]. +pub fn quaternary(a1: &Bitmap, a2: &Bitmap, a3: &Bitmap, a4: &Bitmap, op: F) -> Bitmap +where + F: Fn(u64, u64, u64, u64) -> u64, +{ + assert_eq!(a1.len(), a2.len()); + assert_eq!(a1.len(), a3.len()); + assert_eq!(a1.len(), a4.len()); + let a1_chunks = a1.chunks(); + let a2_chunks = a2.chunks(); + let a3_chunks = a3.chunks(); + let a4_chunks = a4.chunks(); + + let rem_a1 = a1_chunks.remainder(); + let rem_a2 = a2_chunks.remainder(); + let rem_a3 = a3_chunks.remainder(); + let rem_a4 = a4_chunks.remainder(); + + let chunks = a1_chunks + .zip(a2_chunks) + .zip(a3_chunks) + .zip(a4_chunks) + .map(|(((a1, a2), a3), a4)| op(a1, a2, a3, a4)); + let buffer = + chunk_iter_to_vec(chunks.chain(std::iter::once(op(rem_a1, rem_a2, rem_a3, rem_a4)))); + + let length = a1.len(); + + Bitmap::from_u8_vec(buffer, length) +} + +/// Apply a bitwise operation `op` to three inputs and return the result as a [`Bitmap`]. +pub fn ternary(a1: &Bitmap, a2: &Bitmap, a3: &Bitmap, op: F) -> Bitmap +where + F: Fn(u64, u64, u64) -> u64, +{ + assert_eq!(a1.len(), a2.len()); + assert_eq!(a1.len(), a3.len()); + let a1_chunks = a1.chunks(); + let a2_chunks = a2.chunks(); + let a3_chunks = a3.chunks(); + + let rem_a1 = a1_chunks.remainder(); + let rem_a2 = a2_chunks.remainder(); + let rem_a3 = a3_chunks.remainder(); + + let chunks = a1_chunks + .zip(a2_chunks) + .zip(a3_chunks) + .map(|((a1, a2), a3)| op(a1, a2, a3)); + + let buffer = chunk_iter_to_vec(chunks.chain(std::iter::once(op(rem_a1, rem_a2, rem_a3)))); + + let length = a1.len(); + + Bitmap::from_u8_vec(buffer, length) +} + +/// Apply a bitwise operation `op` to two inputs and return the result as a [`Bitmap`]. +pub fn binary(lhs: &Bitmap, rhs: &Bitmap, op: F) -> Bitmap +where + F: Fn(u64, u64) -> u64, +{ + assert_eq!(lhs.len(), rhs.len()); + let lhs_chunks = lhs.chunks(); + let rhs_chunks = rhs.chunks(); + let rem_lhs = lhs_chunks.remainder(); + let rem_rhs = rhs_chunks.remainder(); + + let chunks = lhs_chunks + .zip(rhs_chunks) + .map(|(left, right)| op(left, right)); + + let buffer = chunk_iter_to_vec(chunks.chain(std::iter::once(op(rem_lhs, rem_rhs)))); + + let length = lhs.len(); + + Bitmap::from_u8_vec(buffer, length) +} + +fn unary_impl(iter: I, op: F, length: usize) -> Bitmap +where + I: BitChunkIterExact, + F: Fn(u64) -> u64, +{ + let rem = op(iter.remainder()); + + let iterator = iter.map(op).chain(std::iter::once(rem)); + + let buffer = chunk_iter_to_vec(iterator); + + Bitmap::from_u8_vec(buffer, length) +} + +/// Apply a bitwise operation `op` to one input and return the result as a [`Bitmap`]. 
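The free functions above (`unary`, `binary`, `ternary`, `quaternary`) are the chunked building blocks the operator impls delegate to; they can also be called directly with a custom `u64 -> u64` op. A sketch, assuming the functions are re-exported from the `bitmap` module as in arrow2:

```rust
use nano_arrow::bitmap::{binary, unary, Bitmap}; // re-exports assumed

let a = Bitmap::from([true, false, true, true]);
let b = Bitmap::from([true, true, false, true]);

// Zips both bitmaps in 64-bit chunks and applies `op` chunk by chunk.
let and = binary(&a, &b, |x, y| x & y);
assert_eq!(and, Bitmap::from([true, false, false, true]));

// Same idea over a single input.
let not_a = unary(&a, |x| !x);
assert_eq!(not_a, Bitmap::from([false, true, false, false]));
```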
+pub fn unary(lhs: &Bitmap, op: F) -> Bitmap +where + F: Fn(u64) -> u64, +{ + let (slice, offset, length) = lhs.as_slice(); + if offset == 0 { + let iter = BitChunksExact::::new(slice, length); + unary_impl(iter, op, lhs.len()) + } else { + let iter = lhs.chunks::(); + unary_impl(iter, op, lhs.len()) + } +} + +// create a new [`Bitmap`] semantically equal to ``bitmap`` but with an offset equal to ``offset`` +pub(crate) fn align(bitmap: &Bitmap, new_offset: usize) -> Bitmap { + let length = bitmap.len(); + + let bitmap: Bitmap = std::iter::repeat(false) + .take(new_offset) + .chain(bitmap.iter()) + .collect(); + + bitmap.sliced(new_offset, length) +} + +#[inline] +/// Compute bitwise AND operation +pub fn and(lhs: &Bitmap, rhs: &Bitmap) -> Bitmap { + if lhs.unset_bits() == lhs.len() || rhs.unset_bits() == rhs.len() { + assert_eq!(lhs.len(), rhs.len()); + Bitmap::new_zeroed(lhs.len()) + } else { + binary(lhs, rhs, |x, y| x & y) + } +} + +#[inline] +/// Compute bitwise OR operation +pub fn or(lhs: &Bitmap, rhs: &Bitmap) -> Bitmap { + if lhs.unset_bits() == 0 || rhs.unset_bits() == 0 { + assert_eq!(lhs.len(), rhs.len()); + let mut mutable = MutableBitmap::with_capacity(lhs.len()); + mutable.extend_constant(lhs.len(), true); + mutable.into() + } else { + binary(lhs, rhs, |x, y| x | y) + } +} + +#[inline] +/// Compute bitwise XOR operation +pub fn xor(lhs: &Bitmap, rhs: &Bitmap) -> Bitmap { + let lhs_nulls = lhs.unset_bits(); + let rhs_nulls = rhs.unset_bits(); + + // all false or all true + if lhs_nulls == rhs_nulls && rhs_nulls == rhs.len() || lhs_nulls == 0 && rhs_nulls == 0 { + assert_eq!(lhs.len(), rhs.len()); + Bitmap::new_zeroed(rhs.len()) + } + // all false and all true or vice versa + else if (lhs_nulls == 0 && rhs_nulls == rhs.len()) + || (lhs_nulls == lhs.len() && rhs_nulls == 0) + { + assert_eq!(lhs.len(), rhs.len()); + let mut mutable = MutableBitmap::with_capacity(lhs.len()); + mutable.extend_constant(lhs.len(), true); + mutable.into() + } else { + binary(lhs, rhs, |x, y| x ^ y) + } +} + +fn eq(lhs: &Bitmap, rhs: &Bitmap) -> bool { + if lhs.len() != rhs.len() { + return false; + } + + let mut lhs_chunks = lhs.chunks::(); + let mut rhs_chunks = rhs.chunks::(); + + let equal_chunks = lhs_chunks + .by_ref() + .zip(rhs_chunks.by_ref()) + .all(|(left, right)| left == right); + + if !equal_chunks { + return false; + } + let lhs_remainder = lhs_chunks.remainder_iter(); + let rhs_remainder = rhs_chunks.remainder_iter(); + lhs_remainder.zip(rhs_remainder).all(|(x, y)| x == y) +} + +impl PartialEq for Bitmap { + fn eq(&self, other: &Self) -> bool { + eq(self, other) + } +} + +impl<'a, 'b> BitOr<&'b Bitmap> for &'a Bitmap { + type Output = Bitmap; + + fn bitor(self, rhs: &'b Bitmap) -> Bitmap { + or(self, rhs) + } +} + +impl<'a, 'b> BitAnd<&'b Bitmap> for &'a Bitmap { + type Output = Bitmap; + + fn bitand(self, rhs: &'b Bitmap) -> Bitmap { + and(self, rhs) + } +} + +impl<'a, 'b> BitXor<&'b Bitmap> for &'a Bitmap { + type Output = Bitmap; + + fn bitxor(self, rhs: &'b Bitmap) -> Bitmap { + xor(self, rhs) + } +} + +impl Not for &Bitmap { + type Output = Bitmap; + + fn not(self) -> Bitmap { + unary(self, |a| !a) + } +} diff --git a/crates/nano-arrow/src/bitmap/immutable.rs b/crates/nano-arrow/src/bitmap/immutable.rs new file mode 100644 index 000000000000..91f1c5942b55 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/immutable.rs @@ -0,0 +1,471 @@ +use std::iter::FromIterator; +use std::ops::Deref; +use std::sync::Arc; + +use either::Either; + +use super::utils::{count_zeros, fmt, get_bit, 
get_bit_unchecked, BitChunk, BitChunks, BitmapIter}; +use super::{chunk_iter_to_vec, IntoIter, MutableBitmap}; +use crate::buffer::Bytes; +use crate::error::Error; +use crate::trusted_len::TrustedLen; + +/// An immutable container semantically equivalent to `Arc>` but represented as `Arc>` where +/// each boolean is represented as a single bit. +/// +/// # Examples +/// ``` +/// use arrow2::bitmap::{Bitmap, MutableBitmap}; +/// +/// let bitmap = Bitmap::from([true, false, true]); +/// assert_eq!(bitmap.iter().collect::>(), vec![true, false, true]); +/// +/// // creation directly from bytes +/// let bitmap = Bitmap::try_new(vec![0b00001101], 5).unwrap(); +/// // note: the first bit is the left-most of the first byte +/// assert_eq!(bitmap.iter().collect::>(), vec![true, false, true, true, false]); +/// // we can also get the slice: +/// assert_eq!(bitmap.as_slice(), ([0b00001101u8].as_ref(), 0, 5)); +/// // debug helps :) +/// assert_eq!(format!("{:?}", bitmap), "[0b___01101]".to_string()); +/// +/// // it supports copy-on-write semantics (to a `MutableBitmap`) +/// let bitmap: MutableBitmap = bitmap.into_mut().right().unwrap(); +/// assert_eq!(bitmap, MutableBitmap::from([true, false, true, true, false])); +/// +/// // slicing is 'O(1)' (data is shared) +/// let bitmap = Bitmap::try_new(vec![0b00001101], 5).unwrap(); +/// let mut sliced = bitmap.clone(); +/// sliced.slice(1, 4); +/// assert_eq!(sliced.as_slice(), ([0b00001101u8].as_ref(), 1, 4)); // 1 here is the offset: +/// assert_eq!(format!("{:?}", sliced), "[0b___0110_]".to_string()); +/// // when sliced (or cloned), it is no longer possible to `into_mut`. +/// let same: Bitmap = sliced.into_mut().left().unwrap(); +/// ``` +#[derive(Clone)] +pub struct Bitmap { + bytes: Arc>, + // both are measured in bits. They are used to bound the bitmap to a region of Bytes. + offset: usize, + length: usize, + // this is a cache: it is computed on initialization + unset_bits: usize, +} + +impl std::fmt::Debug for Bitmap { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + let (bytes, offset, len) = self.as_slice(); + fmt(bytes, offset, len, f) + } +} + +impl Default for Bitmap { + fn default() -> Self { + MutableBitmap::new().into() + } +} + +pub(super) fn check(bytes: &[u8], offset: usize, length: usize) -> Result<(), Error> { + if offset + length > bytes.len().saturating_mul(8) { + return Err(Error::InvalidArgumentError(format!( + "The offset + length of the bitmap ({}) must be `<=` to the number of bytes times 8 ({})", + offset + length, + bytes.len().saturating_mul(8) + ))); + } + Ok(()) +} + +impl Bitmap { + /// Initializes an empty [`Bitmap`]. + #[inline] + pub fn new() -> Self { + Self::default() + } + + /// Initializes a new [`Bitmap`] from vector of bytes and a length. + /// # Errors + /// This function errors iff `length > bytes.len() * 8` + #[inline] + pub fn try_new(bytes: Vec, length: usize) -> Result { + check(&bytes, 0, length)?; + let unset_bits = count_zeros(&bytes, 0, length); + Ok(Self { + length, + offset: 0, + bytes: Arc::new(bytes.into()), + unset_bits, + }) + } + + /// Returns the length of the [`Bitmap`]. + #[inline] + pub fn len(&self) -> usize { + self.length + } + + /// Returns whether [`Bitmap`] is empty + #[inline] + pub fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// Returns a new iterator of `bool` over this bitmap + pub fn iter(&self) -> BitmapIter { + BitmapIter::new(&self.bytes, self.offset, self.length) + } + + /// Returns an iterator over bits in bit chunks [`BitChunk`]. 
+ /// + /// This iterator is useful to operate over multiple bits via e.g. bitwise. + pub fn chunks(&self) -> BitChunks { + BitChunks::new(&self.bytes, self.offset, self.length) + } + + /// Returns the byte slice of this [`Bitmap`]. + /// + /// The returned tuple contains: + /// * `.1`: The byte slice, truncated to the start of the first bit. So the start of the slice + /// is within the first 8 bits. + /// * `.2`: The start offset in bits on a range `0 <= offsets < 8`. + /// * `.3`: The length in number of bits. + #[inline] + pub fn as_slice(&self) -> (&[u8], usize, usize) { + let start = self.offset / 8; + let len = (self.offset % 8 + self.length).saturating_add(7) / 8; + ( + &self.bytes[start..start + len], + self.offset % 8, + self.length, + ) + } + + /// Returns the number of unset bits on this [`Bitmap`]. + /// + /// Guaranteed to be `<= self.len()`. + /// # Implementation + /// This function is `O(1)` - the number of unset bits is computed when the bitmap is + /// created + pub const fn unset_bits(&self) -> usize { + self.unset_bits + } + + /// Returns the number of unset bits on this [`Bitmap`]. + #[inline] + #[deprecated(since = "0.13.0", note = "use `unset_bits` instead")] + pub fn null_count(&self) -> usize { + self.unset_bits + } + + /// Slices `self`, offsetting by `offset` and truncating up to `length` bits. + /// # Panic + /// Panics iff `offset + length > self.length`, i.e. if the offset and `length` + /// exceeds the allocated capacity of `self`. + #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!(offset + length <= self.length); + unsafe { self.slice_unchecked(offset, length) } + } + + /// Slices `self`, offsetting by `offset` and truncating up to `length` bits. + /// # Safety + /// The caller must ensure that `self.offset + offset + length <= self.len()` + #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + // first guard a no-op slice so that we don't do a bitcount + // if there isn't any data sliced + if !(offset == 0 && length == self.length) { + // count the smallest chunk + if length < self.length / 2 { + // count the null values in the slice + self.unset_bits = count_zeros(&self.bytes, self.offset + offset, length); + } else { + // subtract the null count of the chunks we slice off + let start_end = self.offset + offset + length; + let head_count = count_zeros(&self.bytes, self.offset, offset); + let tail_count = count_zeros(&self.bytes, start_end, self.length - length - offset); + self.unset_bits -= head_count + tail_count; + } + self.offset += offset; + self.length = length; + } + } + + /// Slices `self`, offsetting by `offset` and truncating up to `length` bits. + /// # Panic + /// Panics iff `offset + length > self.length`, i.e. if the offset and `length` + /// exceeds the allocated capacity of `self`. + #[inline] + #[must_use] + pub fn sliced(self, offset: usize, length: usize) -> Self { + assert!(offset + length <= self.length); + unsafe { self.sliced_unchecked(offset, length) } + } + + /// Slices `self`, offsetting by `offset` and truncating up to `length` bits. + /// # Safety + /// The caller must ensure that `self.offset + offset + length <= self.len()` + #[inline] + #[must_use] + pub unsafe fn sliced_unchecked(mut self, offset: usize, length: usize) -> Self { + self.slice_unchecked(offset, length); + self + } + + /// Returns whether the bit at position `i` is set. + /// # Panics + /// Panics iff `i >= self.len()`. 
+ #[inline] + pub fn get_bit(&self, i: usize) -> bool { + get_bit(&self.bytes, self.offset + i) + } + + /// Unsafely returns whether the bit at position `i` is set. + /// # Safety + /// Unsound iff `i >= self.len()`. + #[inline] + pub unsafe fn get_bit_unchecked(&self, i: usize) -> bool { + get_bit_unchecked(&self.bytes, self.offset + i) + } + + /// Returns a pointer to the start of this [`Bitmap`] (ignores `offsets`) + /// This pointer is allocated iff `self.len() > 0`. + pub(crate) fn as_ptr(&self) -> *const u8 { + self.bytes.deref().as_ptr() + } + + /// Returns a pointer to the start of this [`Bitmap`] (ignores `offsets`) + /// This pointer is allocated iff `self.len() > 0`. + pub(crate) fn offset(&self) -> usize { + self.offset + } + + /// Converts this [`Bitmap`] to [`MutableBitmap`], returning itself if the conversion + /// is not possible + /// + /// This operation returns a [`MutableBitmap`] iff: + /// * this [`Bitmap`] is not an offsetted slice of another [`Bitmap`] + /// * this [`Bitmap`] has not been cloned (i.e. [`Arc`]`::get_mut` yields [`Some`]) + /// * this [`Bitmap`] was not imported from the c data interface (FFI) + pub fn into_mut(mut self) -> Either { + match ( + self.offset, + Arc::get_mut(&mut self.bytes).and_then(|b| b.get_vec()), + ) { + (0, Some(v)) => { + let data = std::mem::take(v); + Either::Right(MutableBitmap::from_vec(data, self.length)) + }, + _ => Either::Left(self), + } + } + + /// Converts this [`Bitmap`] into a [`MutableBitmap`], cloning its internal + /// buffer if required (clone-on-write). + pub fn make_mut(self) -> MutableBitmap { + match self.into_mut() { + Either::Left(data) => { + if data.offset > 0 { + // re-align the bits (remove the offset) + let chunks = data.chunks::(); + let remainder = chunks.remainder(); + let vec = chunk_iter_to_vec(chunks.chain(std::iter::once(remainder))); + MutableBitmap::from_vec(vec, data.length) + } else { + MutableBitmap::from_vec(data.bytes.as_ref().to_vec(), data.length) + } + }, + Either::Right(data) => data, + } + } + + /// Initializes an new [`Bitmap`] filled with unset values. + #[inline] + pub fn new_zeroed(length: usize) -> Self { + // don't use `MutableBitmap::from_len_zeroed().into()` + // it triggers a bitcount + let bytes = vec![0; length.saturating_add(7) / 8]; + unsafe { Bitmap::from_inner_unchecked(Arc::new(bytes.into()), 0, length, length) } + } + + /// Counts the nulls (unset bits) starting from `offset` bits and for `length` bits. + #[inline] + pub fn null_count_range(&self, offset: usize, length: usize) -> usize { + count_zeros(&self.bytes, self.offset + offset, length) + } + + /// Creates a new [`Bitmap`] from a slice and length. + /// # Panic + /// Panics iff `length <= bytes.len() * 8` + #[inline] + pub fn from_u8_slice>(slice: T, length: usize) -> Self { + Bitmap::try_new(slice.as_ref().to_vec(), length).unwrap() + } + + /// Alias for `Bitmap::try_new().unwrap()` + /// This function is `O(1)` + /// # Panic + /// This function panics iff `length <= bytes.len() * 8` + #[inline] + pub fn from_u8_vec(vec: Vec, length: usize) -> Self { + Bitmap::try_new(vec, length).unwrap() + } + + /// Returns whether the bit at position `i` is set. 
+ #[inline] + pub fn get(&self, i: usize) -> Option { + if i < self.len() { + Some(unsafe { self.get_bit_unchecked(i) }) + } else { + None + } + } + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (Arc>, usize, usize, usize) { + let Self { + bytes, + offset, + length, + unset_bits, + } = self; + (bytes, offset, length, unset_bits) + } + + /// Creates a `[Bitmap]` from its internal representation. + /// This is the inverted from `[Bitmap::into_inner]` + /// + /// # Safety + /// The invariants of this struct must be upheld + pub unsafe fn from_inner( + bytes: Arc>, + offset: usize, + length: usize, + unset_bits: usize, + ) -> Result { + check(&bytes, offset, length)?; + Ok(Self { + bytes, + offset, + length, + unset_bits, + }) + } + + /// Creates a `[Bitmap]` from its internal representation. + /// This is the inverted from `[Bitmap::into_inner]` + /// + /// # Safety + /// Callers must ensure all invariants of this struct are upheld. + pub unsafe fn from_inner_unchecked( + bytes: Arc>, + offset: usize, + length: usize, + unset_bits: usize, + ) -> Self { + Self { + bytes, + offset, + length, + unset_bits, + } + } +} + +impl> From


for Bitmap { + fn from(slice: P) -> Self { + Self::from_trusted_len_iter(slice.as_ref().iter().copied()) + } +} + +impl FromIterator for Bitmap { + fn from_iter(iter: I) -> Self + where + I: IntoIterator, + { + MutableBitmap::from_iter(iter).into() + } +} + +impl Bitmap { + /// Creates a new [`Bitmap`] from an iterator of booleans. + /// # Safety + /// The iterator must report an accurate length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked>(iterator: I) -> Self { + MutableBitmap::from_trusted_len_iter_unchecked(iterator).into() + } + + /// Creates a new [`Bitmap`] from an iterator of booleans. + #[inline] + pub fn from_trusted_len_iter>(iterator: I) -> Self { + MutableBitmap::from_trusted_len_iter(iterator).into() + } + + /// Creates a new [`Bitmap`] from a fallible iterator of booleans. + #[inline] + pub fn try_from_trusted_len_iter>>( + iterator: I, + ) -> std::result::Result { + Ok(MutableBitmap::try_from_trusted_len_iter(iterator)?.into()) + } + + /// Creates a new [`Bitmap`] from a fallible iterator of booleans. + /// # Safety + /// The iterator must report an accurate length. + #[inline] + pub unsafe fn try_from_trusted_len_iter_unchecked< + E, + I: Iterator>, + >( + iterator: I, + ) -> std::result::Result { + Ok(MutableBitmap::try_from_trusted_len_iter_unchecked(iterator)?.into()) + } + + /// Create a new [`Bitmap`] from an arrow [`NullBuffer`] + /// + /// [`NullBuffer`]: arrow_buffer::buffer::NullBuffer + #[cfg(feature = "arrow")] + pub fn from_null_buffer(value: arrow_buffer::buffer::NullBuffer) -> Self { + let offset = value.offset(); + let length = value.len(); + let unset_bits = value.null_count(); + Self { + offset, + length, + unset_bits, + bytes: Arc::new(crate::buffer::to_bytes(value.buffer().clone())), + } + } +} + +impl<'a> IntoIterator for &'a Bitmap { + type Item = bool; + type IntoIter = BitmapIter<'a>; + + fn into_iter(self) -> Self::IntoIter { + BitmapIter::<'a>::new(&self.bytes, self.offset, self.length) + } +} + +impl IntoIterator for Bitmap { + type Item = bool; + type IntoIter = IntoIter; + + fn into_iter(self) -> Self::IntoIter { + IntoIter::new(self) + } +} + +#[cfg(feature = "arrow")] +impl From for arrow_buffer::buffer::NullBuffer { + fn from(value: Bitmap) -> Self { + let null_count = value.unset_bits; + let buffer = crate::buffer::to_buffer(value.bytes); + let buffer = arrow_buffer::buffer::BooleanBuffer::new(buffer, value.offset, value.length); + // Safety: null count is accurate + unsafe { arrow_buffer::buffer::NullBuffer::new_unchecked(buffer, null_count) } + } +} diff --git a/crates/nano-arrow/src/bitmap/iterator.rs b/crates/nano-arrow/src/bitmap/iterator.rs new file mode 100644 index 000000000000..93ca7fb8576a --- /dev/null +++ b/crates/nano-arrow/src/bitmap/iterator.rs @@ -0,0 +1,68 @@ +use super::Bitmap; +use crate::trusted_len::TrustedLen; + +/// This crates' equivalent of [`std::vec::IntoIter`] for [`Bitmap`]. 
+#[derive(Debug, Clone)] +pub struct IntoIter { + values: Bitmap, + index: usize, + end: usize, +} + +impl IntoIter { + /// Creates a new [`IntoIter`] from a [`Bitmap`] + #[inline] + pub fn new(values: Bitmap) -> Self { + let end = values.len(); + Self { + values, + index: 0, + end, + } + } +} + +impl Iterator for IntoIter { + type Item = bool; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + Some(unsafe { self.values.get_bit_unchecked(old) }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + let new_index = self.index + n; + if new_index > self.end { + self.index = self.end; + None + } else { + self.index = new_index; + self.next() + } + } +} + +impl DoubleEndedIterator for IntoIter { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + Some(unsafe { self.values.get_bit_unchecked(self.end) }) + } + } +} + +unsafe impl TrustedLen for IntoIter {} diff --git a/crates/nano-arrow/src/bitmap/mod.rs b/crates/nano-arrow/src/bitmap/mod.rs new file mode 100644 index 000000000000..dea2645c1466 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/mod.rs @@ -0,0 +1,17 @@ +//! contains [`Bitmap`] and [`MutableBitmap`], containers of `bool`. +mod immutable; +pub use immutable::*; + +mod iterator; +pub use iterator::IntoIter; + +mod mutable; +pub use mutable::MutableBitmap; + +mod bitmap_ops; +pub use bitmap_ops::*; + +mod assign_ops; +pub use assign_ops::*; + +pub mod utils; diff --git a/crates/nano-arrow/src/bitmap/mutable.rs b/crates/nano-arrow/src/bitmap/mutable.rs new file mode 100644 index 000000000000..e52e39ba3200 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/mutable.rs @@ -0,0 +1,755 @@ +use std::hint::unreachable_unchecked; +use std::iter::FromIterator; +use std::sync::Arc; + +use super::utils::{ + count_zeros, fmt, get_bit, set, set_bit, BitChunk, BitChunksExactMut, BitmapIter, +}; +use super::Bitmap; +use crate::bitmap::utils::{merge_reversed, set_bit_unchecked}; +use crate::error::Error; +use crate::trusted_len::TrustedLen; + +/// A container of booleans. [`MutableBitmap`] is semantically equivalent +/// to [`Vec`]. +/// +/// The two main differences against [`Vec`] is that each element stored as a single bit, +/// thereby: +/// * it uses 8x less memory +/// * it cannot be represented as `&[bool]` (i.e. no pointer arithmetics). +/// +/// A [`MutableBitmap`] can be converted to a [`Bitmap`] at `O(1)`. 
+/// # Examples +/// ``` +/// use arrow2::bitmap::MutableBitmap; +/// +/// let bitmap = MutableBitmap::from([true, false, true]); +/// assert_eq!(bitmap.iter().collect::>(), vec![true, false, true]); +/// +/// // creation directly from bytes +/// let mut bitmap = MutableBitmap::try_new(vec![0b00001101], 5).unwrap(); +/// // note: the first bit is the left-most of the first byte +/// assert_eq!(bitmap.iter().collect::>(), vec![true, false, true, true, false]); +/// // we can also get the slice: +/// assert_eq!(bitmap.as_slice(), [0b00001101u8].as_ref()); +/// // debug helps :) +/// assert_eq!(format!("{:?}", bitmap), "[0b___01101]".to_string()); +/// +/// // It supports mutation in place +/// bitmap.set(0, false); +/// assert_eq!(format!("{:?}", bitmap), "[0b___01100]".to_string()); +/// // and `O(1)` random access +/// assert_eq!(bitmap.get(0), false); +/// ``` +/// # Implementation +/// This container is internally a [`Vec`]. +#[derive(Clone)] +pub struct MutableBitmap { + buffer: Vec, + // invariant: length.saturating_add(7) / 8 == buffer.len(); + length: usize, +} + +impl std::fmt::Debug for MutableBitmap { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + fmt(&self.buffer, 0, self.len(), f) + } +} + +impl PartialEq for MutableBitmap { + fn eq(&self, other: &Self) -> bool { + self.iter().eq(other.iter()) + } +} + +impl MutableBitmap { + /// Initializes an empty [`MutableBitmap`]. + #[inline] + pub fn new() -> Self { + Self { + buffer: Vec::new(), + length: 0, + } + } + + /// Initializes a new [`MutableBitmap`] from a [`Vec`] and a length. + /// # Errors + /// This function errors iff `length > bytes.len() * 8` + #[inline] + pub fn try_new(bytes: Vec, length: usize) -> Result { + if length > bytes.len().saturating_mul(8) { + return Err(Error::InvalidArgumentError(format!( + "The length of the bitmap ({}) must be `<=` to the number of bytes times 8 ({})", + length, + bytes.len().saturating_mul(8) + ))); + } + Ok(Self { + length, + buffer: bytes, + }) + } + + /// Initializes a [`MutableBitmap`] from a [`Vec`] and a length. + /// This function is `O(1)`. + /// # Panic + /// Panics iff the length is larger than the length of the buffer times 8. + #[inline] + pub fn from_vec(buffer: Vec, length: usize) -> Self { + Self::try_new(buffer, length).unwrap() + } + + /// Initializes a pre-allocated [`MutableBitmap`] with capacity for `capacity` bits. + #[inline] + pub fn with_capacity(capacity: usize) -> Self { + Self { + buffer: Vec::with_capacity(capacity.saturating_add(7) / 8), + length: 0, + } + } + + /// Pushes a new bit to the [`MutableBitmap`], re-sizing it if necessary. + #[inline] + pub fn push(&mut self, value: bool) { + if self.length % 8 == 0 { + self.buffer.push(0); + } + let byte = self.buffer.as_mut_slice().last_mut().unwrap(); + *byte = set(*byte, self.length % 8, value); + self.length += 1; + } + + /// Pop the last bit from the [`MutableBitmap`]. + /// Note if the [`MutableBitmap`] is empty, this method will return None. + #[inline] + pub fn pop(&mut self) -> Option { + if self.is_empty() { + return None; + } + + self.length -= 1; + let value = self.get(self.length); + if self.length % 8 == 0 { + self.buffer.pop(); + } + Some(value) + } + + /// Returns whether the position `index` is set. + /// # Panics + /// Panics iff `index >= self.len()`. + #[inline] + pub fn get(&self, index: usize) -> bool { + get_bit(&self.buffer, index) + } + + /// Sets the position `index` to `value` + /// # Panics + /// Panics iff `index >= self.len()`. 
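The `push`/`pop`/`get` methods documented above behave like their `Vec<bool>` counterparts, and a finished `MutableBitmap` converts into an immutable `Bitmap` without copying the byte buffer. A short sketch (same `nano_arrow` path assumption as the previous example):

```rust
use nano_arrow::bitmap::{Bitmap, MutableBitmap};

let mut bits = MutableBitmap::new();
bits.push(true);
bits.push(false);
bits.push(true);
assert_eq!(bits.len(), 3);
assert!(bits.get(0));

bits.set(1, true); // in-place mutation
assert_eq!(bits.pop(), Some(true)); // removes the last bit

// freeze into an immutable `Bitmap`; the byte buffer is reused as-is
let frozen: Bitmap = bits.into();
assert_eq!(frozen.unset_bits(), 0);
```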
+ #[inline] + pub fn set(&mut self, index: usize, value: bool) { + set_bit(self.buffer.as_mut_slice(), index, value) + } + + /// constructs a new iterator over the bits of [`MutableBitmap`]. + pub fn iter(&self) -> BitmapIter { + BitmapIter::new(&self.buffer, 0, self.length) + } + + /// Empties the [`MutableBitmap`]. + #[inline] + pub fn clear(&mut self) { + self.length = 0; + self.buffer.clear(); + } + + /// Extends [`MutableBitmap`] by `additional` values of constant `value`. + /// # Implementation + /// This function is an order of magnitude faster than pushing element by element. + #[inline] + pub fn extend_constant(&mut self, additional: usize, value: bool) { + if additional == 0 { + return; + } + + if value { + self.extend_set(additional) + } else { + self.extend_unset(additional) + } + } + + /// Initializes a zeroed [`MutableBitmap`]. + #[inline] + pub fn from_len_zeroed(length: usize) -> Self { + Self { + buffer: vec![0; length.saturating_add(7) / 8], + length, + } + } + + /// Initializes a [`MutableBitmap`] with all values set to valid/ true. + #[inline] + pub fn from_len_set(length: usize) -> Self { + Self { + buffer: vec![u8::MAX; length.saturating_add(7) / 8], + length, + } + } + + /// Reserves `additional` bits in the [`MutableBitmap`], potentially re-allocating its buffer. + #[inline(always)] + pub fn reserve(&mut self, additional: usize) { + self.buffer + .reserve((self.length + additional).saturating_add(7) / 8 - self.buffer.len()) + } + + /// Returns the capacity of [`MutableBitmap`] in number of bits. + #[inline] + pub fn capacity(&self) -> usize { + self.buffer.capacity() * 8 + } + + /// Pushes a new bit to the [`MutableBitmap`] + /// # Safety + /// The caller must ensure that the [`MutableBitmap`] has sufficient capacity. + #[inline] + pub unsafe fn push_unchecked(&mut self, value: bool) { + if self.length % 8 == 0 { + self.buffer.push(0); + } + let byte = self.buffer.as_mut_slice().last_mut().unwrap(); + *byte = set(*byte, self.length % 8, value); + self.length += 1; + } + + /// Returns the number of unset bits on this [`MutableBitmap`]. + /// + /// Guaranteed to be `<= self.len()`. + /// # Implementation + /// This function is `O(N)` + pub fn unset_bits(&self) -> usize { + count_zeros(&self.buffer, 0, self.length) + } + + /// Returns the number of unset bits on this [`MutableBitmap`]. + #[deprecated(since = "0.13.0", note = "use `unset_bits` instead")] + pub fn null_count(&self) -> usize { + self.unset_bits() + } + + /// Returns the length of the [`MutableBitmap`]. + #[inline] + pub fn len(&self) -> usize { + self.length + } + + /// Returns whether [`MutableBitmap`] is empty. + #[inline] + pub fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// # Safety + /// The caller must ensure that the [`MutableBitmap`] was properly initialized up to `len`. 
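For bulk construction, `from_len_zeroed`/`from_len_set` plus `extend_constant` avoid pushing bit by bit. A sketch:

```rust
use nano_arrow::bitmap::MutableBitmap;

// 4 unset bits, then 8 set bits appended in bulk
let mut validity = MutableBitmap::from_len_zeroed(4);
validity.extend_constant(8, true);

assert_eq!(validity.len(), 12);
assert_eq!(validity.unset_bits(), 4);
assert!(!validity.get(3));
assert!(validity.get(4));
```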
+ #[inline] + pub(crate) unsafe fn set_len(&mut self, len: usize) { + self.buffer.set_len(len.saturating_add(7) / 8); + self.length = len; + } + + fn extend_set(&mut self, mut additional: usize) { + let offset = self.length % 8; + let added = if offset != 0 { + // offset != 0 => at least one byte in the buffer + let last_index = self.buffer.len() - 1; + let last = &mut self.buffer[last_index]; + + let remaining = 0b11111111u8; + let remaining = remaining >> 8usize.saturating_sub(additional); + let remaining = remaining << offset; + *last |= remaining; + std::cmp::min(additional, 8 - offset) + } else { + 0 + }; + self.length += added; + additional = additional.saturating_sub(added); + if additional > 0 { + debug_assert_eq!(self.length % 8, 0); + let existing = self.length.saturating_add(7) / 8; + let required = (self.length + additional).saturating_add(7) / 8; + // add remaining as full bytes + self.buffer + .extend(std::iter::repeat(0b11111111u8).take(required - existing)); + self.length += additional; + } + } + + fn extend_unset(&mut self, mut additional: usize) { + let offset = self.length % 8; + let added = if offset != 0 { + // offset != 0 => at least one byte in the buffer + let last_index = self.buffer.len() - 1; + let last = &mut self.buffer[last_index]; + *last &= 0b11111111u8 >> (8 - offset); // unset them + std::cmp::min(additional, 8 - offset) + } else { + 0 + }; + self.length += added; + additional = additional.saturating_sub(added); + if additional > 0 { + debug_assert_eq!(self.length % 8, 0); + self.buffer + .resize((self.length + additional).saturating_add(7) / 8, 0); + self.length += additional; + } + } + + /// Sets the position `index` to `value` + /// # Safety + /// Caller must ensure that `index < self.len()` + #[inline] + pub unsafe fn set_unchecked(&mut self, index: usize, value: bool) { + set_bit_unchecked(self.buffer.as_mut_slice(), index, value) + } + + /// Shrinks the capacity of the [`MutableBitmap`] to fit its current length. + pub fn shrink_to_fit(&mut self) { + self.buffer.shrink_to_fit(); + } + + /// Returns an iterator over mutable slices, [`BitChunksExactMut`] + pub(crate) fn bitchunks_exact_mut(&mut self) -> BitChunksExactMut { + BitChunksExactMut::new(&mut self.buffer, self.length) + } +} + +impl From for Bitmap { + #[inline] + fn from(buffer: MutableBitmap) -> Self { + Bitmap::try_new(buffer.buffer, buffer.length).unwrap() + } +} + +impl From for Option { + #[inline] + fn from(buffer: MutableBitmap) -> Self { + let unset_bits = buffer.unset_bits(); + if unset_bits > 0 { + // safety: + // invariants of the `MutableBitmap` equal that of `Bitmap` + let bitmap = unsafe { + Bitmap::from_inner_unchecked( + Arc::new(buffer.buffer.into()), + 0, + buffer.length, + unset_bits, + ) + }; + Some(bitmap) + } else { + None + } + } +} + +impl> From

for MutableBitmap { + #[inline] + fn from(slice: P) -> Self { + MutableBitmap::from_trusted_len_iter(slice.as_ref().iter().copied()) + } +} + +impl FromIterator for MutableBitmap { + fn from_iter(iter: I) -> Self + where + I: IntoIterator, + { + let mut iterator = iter.into_iter(); + let mut buffer = { + let byte_capacity: usize = iterator.size_hint().0.saturating_add(7) / 8; + Vec::with_capacity(byte_capacity) + }; + + let mut length = 0; + + loop { + let mut exhausted = false; + let mut byte_accum: u8 = 0; + let mut mask: u8 = 1; + + //collect (up to) 8 bits into a byte + while mask != 0 { + if let Some(value) = iterator.next() { + length += 1; + byte_accum |= match value { + true => mask, + false => 0, + }; + mask <<= 1; + } else { + exhausted = true; + break; + } + } + + // break if the iterator was exhausted before it provided a bool for this byte + if exhausted && mask == 1 { + break; + } + + //ensure we have capacity to write the byte + if buffer.len() == buffer.capacity() { + //no capacity for new byte, allocate 1 byte more (plus however many more the iterator advertises) + let additional_byte_capacity = 1usize.saturating_add( + iterator.size_hint().0.saturating_add(7) / 8, //convert bit count to byte count, rounding up + ); + buffer.reserve(additional_byte_capacity) + } + + // Soundness: capacity was allocated above + buffer.push(byte_accum); + if exhausted { + break; + } + } + Self { buffer, length } + } +} + +// [7, 6, 5, 4, 3, 2, 1, 0], [15, 14, 13, 12, 11, 10, 9, 8] +// [00000001_00000000_00000000_00000000_...] // u64 +/// # Safety +/// The iterator must be trustedLen and its len must be least `len`. +#[inline] +unsafe fn get_chunk_unchecked(iterator: &mut impl Iterator) -> u64 { + let mut byte = 0u64; + let mut mask; + for i in 0..8 { + mask = 1u64 << (8 * i); + for _ in 0..8 { + let value = match iterator.next() { + Some(value) => value, + None => unsafe { unreachable_unchecked() }, + }; + + byte |= match value { + true => mask, + false => 0, + }; + mask <<= 1; + } + } + byte +} + +/// # Safety +/// The iterator must be trustedLen and its len must be least `len`. +#[inline] +unsafe fn get_byte_unchecked(len: usize, iterator: &mut impl Iterator) -> u8 { + let mut byte_accum: u8 = 0; + let mut mask: u8 = 1; + for _ in 0..len { + let value = match iterator.next() { + Some(value) => value, + None => unsafe { unreachable_unchecked() }, + }; + + byte_accum |= match value { + true => mask, + false => 0, + }; + mask <<= 1; + } + byte_accum +} + +/// Extends the [`Vec`] from `iterator` +/// # Safety +/// The iterator MUST be [`TrustedLen`]. 
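The `FromIterator` implementation above packs incoming booleans LSB-first, eight per byte, reserving capacity in byte units from the iterator's size hint. A sketch of the resulting layout:

```rust
use nano_arrow::bitmap::MutableBitmap;

// bits 0, 2, 4, 6, 8 are set
let bits: MutableBitmap = (0..10).map(|i| i % 2 == 0).collect();
assert_eq!(bits.len(), 10);

// LSB-first packing: first byte 0b0101_0101, the two leftover bits in a second byte
assert_eq!(bits.as_slice(), [0b0101_0101u8, 0b0000_0001].as_ref());
```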
+#[inline] +unsafe fn extend_aligned_trusted_iter_unchecked( + buffer: &mut Vec, + mut iterator: impl Iterator, +) -> usize { + let additional_bits = iterator.size_hint().1.unwrap(); + let chunks = additional_bits / 64; + let remainder = additional_bits % 64; + + let additional = (additional_bits + 7) / 8; + assert_eq!( + additional, + // a hint of how the following calculation will be done + chunks * 8 + remainder / 8 + (remainder % 8 > 0) as usize + ); + buffer.reserve(additional); + + // chunks of 64 bits + for _ in 0..chunks { + let chunk = get_chunk_unchecked(&mut iterator); + buffer.extend_from_slice(&chunk.to_le_bytes()); + } + + // remaining complete bytes + for _ in 0..(remainder / 8) { + let byte = unsafe { get_byte_unchecked(8, &mut iterator) }; + buffer.push(byte) + } + + // remaining bits + let remainder = remainder % 8; + if remainder > 0 { + let byte = unsafe { get_byte_unchecked(remainder, &mut iterator) }; + buffer.push(byte) + } + additional_bits +} + +impl MutableBitmap { + /// Extends `self` from a [`TrustedLen`] iterator. + #[inline] + pub fn extend_from_trusted_len_iter>(&mut self, iterator: I) { + // safety: I: TrustedLen + unsafe { self.extend_from_trusted_len_iter_unchecked(iterator) } + } + + /// Extends `self` from an iterator of trusted len. + /// # Safety + /// The caller must guarantee that the iterator has a trusted len. + #[inline] + pub unsafe fn extend_from_trusted_len_iter_unchecked>( + &mut self, + mut iterator: I, + ) { + // the length of the iterator throughout this function. + let mut length = iterator.size_hint().1.unwrap(); + + let bit_offset = self.length % 8; + + if length < 8 - bit_offset { + if bit_offset == 0 { + self.buffer.push(0); + } + // the iterator will not fill the last byte + let byte = self.buffer.as_mut_slice().last_mut().unwrap(); + let mut i = bit_offset; + for value in iterator { + *byte = set(*byte, i, value); + i += 1; + } + self.length += length; + return; + } + + // at this point we know that length will hit a byte boundary and thus + // increase the buffer. + + if bit_offset != 0 { + // we are in the middle of a byte; lets finish it + let byte = self.buffer.as_mut_slice().last_mut().unwrap(); + (bit_offset..8).for_each(|i| { + *byte = set(*byte, i, iterator.next().unwrap()); + }); + self.length += 8 - bit_offset; + length -= 8 - bit_offset; + } + + // everything is aligned; proceed with the bulk operation + debug_assert_eq!(self.length % 8, 0); + + unsafe { extend_aligned_trusted_iter_unchecked(&mut self.buffer, iterator) }; + self.length += length; + } + + /// Creates a new [`MutableBitmap`] from an iterator of booleans. + /// # Safety + /// The iterator must report an accurate length. + #[inline] + pub unsafe fn from_trusted_len_iter_unchecked(iterator: I) -> Self + where + I: Iterator, + { + let mut buffer = Vec::::new(); + + let length = extend_aligned_trusted_iter_unchecked(&mut buffer, iterator); + + Self { buffer, length } + } + + /// Creates a new [`MutableBitmap`] from an iterator of booleans. + #[inline] + pub fn from_trusted_len_iter(iterator: I) -> Self + where + I: TrustedLen, + { + // Safety: Iterator is `TrustedLen` + unsafe { Self::from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a new [`MutableBitmap`] from an iterator of booleans. + pub fn try_from_trusted_len_iter(iterator: I) -> std::result::Result + where + I: TrustedLen>, + { + unsafe { Self::try_from_trusted_len_iter_unchecked(iterator) } + } + + /// Creates a new [`MutableBitmap`] from an falible iterator of booleans. 
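`extend_from_trusted_len_iter` switches to the chunked helpers above once the destination reaches a byte boundary; any iterator this crate marks as `TrustedLen` qualifies, for example a `BitmapIter`. A sketch:

```rust
use nano_arrow::bitmap::MutableBitmap;

let src = MutableBitmap::from([true, false, true, true]);
let mut dst = MutableBitmap::from_len_set(3);

// `MutableBitmap::iter` yields a `BitmapIter`, which implements `TrustedLen`
dst.extend_from_trusted_len_iter(src.iter());

assert_eq!(dst.len(), 7);
assert_eq!(dst.unset_bits(), 1);
```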
+ /// # Safety + /// The caller must guarantee that the iterator is `TrustedLen`. + pub unsafe fn try_from_trusted_len_iter_unchecked( + mut iterator: I, + ) -> std::result::Result + where + I: Iterator>, + { + let length = iterator.size_hint().1.unwrap(); + + let mut buffer = vec![0u8; (length + 7) / 8]; + + let chunks = length / 8; + let reminder = length % 8; + + let data = buffer.as_mut_slice(); + data[..chunks].iter_mut().try_for_each(|byte| { + (0..8).try_for_each(|i| { + *byte = set(*byte, i, iterator.next().unwrap()?); + Ok(()) + }) + })?; + + if reminder != 0 { + let last = &mut data[chunks]; + iterator.enumerate().try_for_each(|(i, value)| { + *last = set(*last, i, value?); + Ok(()) + })?; + } + + Ok(Self { buffer, length }) + } + + fn extend_unaligned(&mut self, slice: &[u8], offset: usize, length: usize) { + // e.g. + // [a, b, --101010] <- to be extended + // [00111111, 11010101] <- to extend + // [a, b, 11101010, --001111] expected result + + let aligned_offset = offset / 8; + let own_offset = self.length % 8; + debug_assert_eq!(offset % 8, 0); // assumed invariant + debug_assert!(own_offset != 0); // assumed invariant + + let bytes_len = length.saturating_add(7) / 8; + let items = &slice[aligned_offset..aligned_offset + bytes_len]; + // self has some offset => we need to shift all `items`, and merge the first + let buffer = self.buffer.as_mut_slice(); + let last = &mut buffer[buffer.len() - 1]; + + // --101010 | 00111111 << 6 = 11101010 + // erase previous + *last &= 0b11111111u8 >> (8 - own_offset); // unset before setting + *last |= items[0] << own_offset; + + if length + own_offset <= 8 { + // no new bytes needed + self.length += length; + return; + } + let additional = length - (8 - own_offset); + + let remaining = [items[items.len() - 1], 0]; + let bytes = items + .windows(2) + .chain(std::iter::once(remaining.as_ref())) + .map(|w| merge_reversed(w[0], w[1], 8 - own_offset)) + .take(additional.saturating_add(7) / 8); + self.buffer.extend(bytes); + + self.length += length; + } + + fn extend_aligned(&mut self, slice: &[u8], offset: usize, length: usize) { + let aligned_offset = offset / 8; + let bytes_len = length.saturating_add(7) / 8; + let items = &slice[aligned_offset..aligned_offset + bytes_len]; + self.buffer.extend_from_slice(items); + self.length += length; + } + + /// Extends the [`MutableBitmap`] from a slice of bytes with optional offset. + /// This is the fastest way to extend a [`MutableBitmap`]. + /// # Implementation + /// When both [`MutableBitmap`]'s length and `offset` are both multiples of 8, + /// this function performs a memcopy. Else, it first aligns bit by bit and then performs a memcopy. + /// # Safety + /// Caller must ensure `offset + length <= slice.len() * 8` + #[inline] + pub unsafe fn extend_from_slice_unchecked( + &mut self, + slice: &[u8], + offset: usize, + length: usize, + ) { + if length == 0 { + return; + }; + let is_aligned = self.length % 8 == 0; + let other_is_aligned = offset % 8 == 0; + match (is_aligned, other_is_aligned) { + (true, true) => self.extend_aligned(slice, offset, length), + (false, true) => self.extend_unaligned(slice, offset, length), + // todo: further optimize the other branches. + _ => self.extend_from_trusted_len_iter(BitmapIter::new(slice, offset, length)), + } + // internal invariant: + debug_assert_eq!(self.length.saturating_add(7) / 8, self.buffer.len()); + } + + /// Extends the [`MutableBitmap`] from a slice of bytes with optional offset. + /// This is the fastest way to extend a [`MutableBitmap`]. 
+ /// # Implementation + /// When both [`MutableBitmap`]'s length and `offset` are both multiples of 8, + /// this function performs a memcopy. Else, it first aligns bit by bit and then performs a memcopy. + #[inline] + pub fn extend_from_slice(&mut self, slice: &[u8], offset: usize, length: usize) { + assert!(offset + length <= slice.len() * 8); + // safety: invariant is asserted + unsafe { self.extend_from_slice_unchecked(slice, offset, length) } + } + + /// Extends the [`MutableBitmap`] from a [`Bitmap`]. + #[inline] + pub fn extend_from_bitmap(&mut self, bitmap: &Bitmap) { + let (slice, offset, length) = bitmap.as_slice(); + // safety: bitmap.as_slice adheres to the invariant + unsafe { + self.extend_from_slice_unchecked(slice, offset, length); + } + } + + /// Returns the slice of bytes of this [`MutableBitmap`]. + /// Note that the last byte may not be fully used. + #[inline] + pub fn as_slice(&self) -> &[u8] { + let len = (self.length).saturating_add(7) / 8; + &self.buffer[..len] + } +} + +impl Default for MutableBitmap { + fn default() -> Self { + Self::new() + } +} + +impl<'a> IntoIterator for &'a MutableBitmap { + type Item = bool; + type IntoIter = BitmapIter<'a>; + + fn into_iter(self) -> Self::IntoIter { + BitmapIter::<'a>::new(&self.buffer, 0, self.length) + } +} diff --git a/crates/nano-arrow/src/bitmap/utils/chunk_iterator/chunks_exact.rs b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/chunks_exact.rs new file mode 100644 index 000000000000..4ab9d300ba02 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/chunks_exact.rs @@ -0,0 +1,101 @@ +use std::convert::TryInto; +use std::slice::ChunksExact; + +use super::{BitChunk, BitChunkIterExact}; +use crate::trusted_len::TrustedLen; + +/// An iterator over a slice of bytes in [`BitChunk`]s. +#[derive(Debug)] +pub struct BitChunksExact<'a, T: BitChunk> { + iter: ChunksExact<'a, u8>, + remainder: &'a [u8], + remainder_len: usize, + phantom: std::marker::PhantomData, +} + +impl<'a, T: BitChunk> BitChunksExact<'a, T> { + /// Creates a new [`BitChunksExact`]. + #[inline] + pub fn new(bitmap: &'a [u8], length: usize) -> Self { + assert!(length <= bitmap.len() * 8); + let size_of = std::mem::size_of::(); + + let bitmap = &bitmap[..length.saturating_add(7) / 8]; + + let split = (length / 8 / size_of) * size_of; + let (chunks, remainder) = bitmap.split_at(split); + let remainder_len = length - chunks.len() * 8; + let iter = chunks.chunks_exact(size_of); + + Self { + iter, + remainder, + remainder_len, + phantom: std::marker::PhantomData, + } + } + + /// Returns the number of chunks of this iterator + #[inline] + pub fn len(&self) -> usize { + self.iter.len() + } + + /// Returns whether there are still elements in this iterator + #[inline] + pub fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// Returns the remaining [`BitChunk`]. It is zero iff `len / 8 == 0`. 
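`extend_from_slice` and `extend_from_bitmap` accept a bit offset, so bits can be appended from an arbitrary position of a packed byte slice. A sketch (byte values chosen for illustration):

```rust
use nano_arrow::bitmap::{Bitmap, MutableBitmap};

let mut bits = MutableBitmap::new();
// append 5 bits starting at bit 2 of the byte 0b1110_0100 (LSB-first)
bits.extend_from_slice(&[0b1110_0100u8], 2, 5);
assert_eq!(
    bits.iter().collect::<Vec<_>>(),
    vec![true, false, false, true, true]
);

// appending a whole `Bitmap` goes through the same code path
bits.extend_from_bitmap(&Bitmap::from([true, true]));
assert_eq!(bits.len(), 7);
```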
+ #[inline] + pub fn remainder(&self) -> T { + let remainder_bytes = self.remainder; + if remainder_bytes.is_empty() { + return T::zero(); + } + let remainder = match remainder_bytes.try_into() { + Ok(a) => a, + Err(_) => { + let mut remainder = T::zero().to_ne_bytes(); + remainder_bytes + .iter() + .enumerate() + .for_each(|(index, b)| remainder[index] = *b); + remainder + }, + }; + T::from_ne_bytes(remainder) + } +} + +impl Iterator for BitChunksExact<'_, T> { + type Item = T; + + #[inline] + fn next(&mut self) -> Option { + self.iter.next().map(|x| match x.try_into() { + Ok(a) => T::from_ne_bytes(a), + Err(_) => unreachable!(), + }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + self.iter.size_hint() + } +} + +unsafe impl TrustedLen for BitChunksExact<'_, T> {} + +impl BitChunkIterExact for BitChunksExact<'_, T> { + #[inline] + fn remainder(&self) -> T { + self.remainder() + } + + #[inline] + fn remainder_len(&self) -> usize { + self.remainder_len + } +} diff --git a/crates/nano-arrow/src/bitmap/utils/chunk_iterator/merge.rs b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/merge.rs new file mode 100644 index 000000000000..81e08df0059e --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/merge.rs @@ -0,0 +1,61 @@ +use super::BitChunk; + +/// Merges 2 [`BitChunk`]s into a single [`BitChunk`] so that the new items represents +/// the bitmap where bits from `next` are placed in `current` according to `offset`. +/// # Panic +/// The caller must ensure that `0 < offset < size_of::() * 8` +/// # Example +/// ```rust,ignore +/// let current = 0b01011001; +/// let next = 0b01011011; +/// let result = merge_reversed(current, next, 1); +/// assert_eq!(result, 0b10101100); +/// ``` +#[inline] +pub fn merge_reversed(mut current: T, mut next: T, offset: usize) -> T +where + T: BitChunk, +{ + // 8 _bits_: + // current = [c0, c1, c2, c3, c4, c5, c6, c7] + // next = [n0, n1, n2, n3, n4, n5, n6, n7] + // offset = 3 + // expected = [n5, n6, n7, c0, c1, c2, c3, c4] + + // 1. unset most significants of `next` up to `offset` + let inverse_offset = std::mem::size_of::() * 8 - offset; + next <<= inverse_offset; + // next = [n5, n6, n7, 0 , 0 , 0 , 0 , 0 ] + + // 2. unset least significants of `current` up to `offset` + current >>= offset; + // current = [0 , 0 , 0 , c0, c1, c2, c3, c4] + + current | next +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_merge_reversed() { + let current = 0b00000000; + let next = 0b00000001; + let result = merge_reversed::(current, next, 1); + assert_eq!(result, 0b10000000); + + let current = 0b01011001; + let next = 0b01011011; + let result = merge_reversed::(current, next, 1); + assert_eq!(result, 0b10101100); + } + + #[test] + fn test_merge_reversed_offset2() { + let current = 0b00000000; + let next = 0b00000001; + let result = merge_reversed::(current, next, 3); + assert_eq!(result, 0b00100000); + } +} diff --git a/crates/nano-arrow/src/bitmap/utils/chunk_iterator/mod.rs b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/mod.rs new file mode 100644 index 000000000000..71f56a284274 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/chunk_iterator/mod.rs @@ -0,0 +1,206 @@ +use std::convert::TryInto; + +mod chunks_exact; +mod merge; + +pub use chunks_exact::BitChunksExact; +pub(crate) use merge::merge_reversed; + +use crate::trusted_len::TrustedLen; +pub use crate::types::BitChunk; +use crate::types::BitChunkIter; + +/// Trait representing an exact iterator over bytes in [`BitChunk`]. 
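`BitChunksExact` splits a packed byte slice into machine-word chunks plus a trailing remainder, which is what lets callers process a bitmap a word at a time. A sketch using `u8` chunks so the asserted values do not depend on endianness:

```rust
use nano_arrow::bitmap::utils::BitChunksExact;

// 10 bits spread over two bytes
let bytes = [0b0110_1001u8, 0b0000_0011];
let mut chunks = BitChunksExact::<u8>::new(&bytes, 10);

// one full 8-bit chunk ...
assert_eq!(chunks.next(), Some(0b0110_1001u8));
// ... and a remainder chunk holding the trailing 2 bits (the upper bits are zero here)
assert_eq!(chunks.remainder(), 0b0000_0011u8);
```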
+pub trait BitChunkIterExact: TrustedLen { + /// The remainder of the iterator. + fn remainder(&self) -> B; + + /// The number of items in the remainder + fn remainder_len(&self) -> usize; + + /// An iterator over individual items of the remainder + #[inline] + fn remainder_iter(&self) -> BitChunkIter { + BitChunkIter::new(self.remainder(), self.remainder_len()) + } +} + +/// This struct is used to efficiently iterate over bit masks by loading bytes on +/// the stack with alignments of `uX`. This allows efficient iteration over bitmaps. +#[derive(Debug)] +pub struct BitChunks<'a, T: BitChunk> { + chunk_iterator: std::slice::ChunksExact<'a, u8>, + current: T, + remainder_bytes: &'a [u8], + last_chunk: T, + remaining: usize, + /// offset inside a byte + bit_offset: usize, + len: usize, + phantom: std::marker::PhantomData, +} + +/// writes `bytes` into `dst`. +#[inline] +fn copy_with_merge(dst: &mut T::Bytes, bytes: &[u8], bit_offset: usize) { + bytes + .windows(2) + .chain(std::iter::once([bytes[bytes.len() - 1], 0].as_ref())) + .take(std::mem::size_of::()) + .enumerate() + .for_each(|(i, w)| { + let val = merge_reversed(w[0], w[1], bit_offset); + dst[i] = val; + }); +} + +impl<'a, T: BitChunk> BitChunks<'a, T> { + /// Creates a [`BitChunks`]. + pub fn new(slice: &'a [u8], offset: usize, len: usize) -> Self { + assert!(offset + len <= slice.len() * 8); + + let slice = &slice[offset / 8..]; + let bit_offset = offset % 8; + let size_of = std::mem::size_of::(); + + let bytes_len = len / 8; + let bytes_upper_len = (len + bit_offset + 7) / 8; + let mut chunks = slice[..bytes_len].chunks_exact(size_of); + + let remainder = &slice[bytes_len - chunks.remainder().len()..bytes_upper_len]; + + let remainder_bytes = if chunks.len() == 0 { slice } else { remainder }; + + let last_chunk = remainder_bytes + .first() + .map(|first| { + let mut last = T::zero().to_ne_bytes(); + last[0] = *first; + T::from_ne_bytes(last) + }) + .unwrap_or_else(T::zero); + + let remaining = chunks.size_hint().0; + + let current = chunks + .next() + .map(|x| match x.try_into() { + Ok(a) => T::from_ne_bytes(a), + Err(_) => unreachable!(), + }) + .unwrap_or_else(T::zero); + + Self { + chunk_iterator: chunks, + len, + current, + remaining, + remainder_bytes, + last_chunk, + bit_offset, + phantom: std::marker::PhantomData, + } + } + + #[inline] + fn load_next(&mut self) { + self.current = match self.chunk_iterator.next().unwrap().try_into() { + Ok(a) => T::from_ne_bytes(a), + Err(_) => unreachable!(), + }; + } + + /// Returns the remainder [`BitChunk`]. + pub fn remainder(&self) -> T { + // remaining bytes may not fit in `size_of::()`. We complement + // them to fit by allocating T and writing to it byte by byte + let mut remainder = T::zero().to_ne_bytes(); + + let remainder = match (self.remainder_bytes.is_empty(), self.bit_offset == 0) { + (true, _) => remainder, + (false, true) => { + // all remaining bytes + self.remainder_bytes + .iter() + .take(std::mem::size_of::()) + .enumerate() + .for_each(|(i, val)| remainder[i] = *val); + + remainder + }, + (false, false) => { + // all remaining bytes + copy_with_merge::(&mut remainder, self.remainder_bytes, self.bit_offset); + remainder + }, + }; + T::from_ne_bytes(remainder) + } + + /// Returns the remainder bits in [`BitChunks::remainder`]. 
+ pub fn remainder_len(&self) -> usize { + self.len - (std::mem::size_of::() * ((self.len / 8) / std::mem::size_of::()) * 8) + } +} + +impl Iterator for BitChunks<'_, T> { + type Item = T; + + #[inline] + fn next(&mut self) -> Option { + if self.remaining == 0 { + return None; + } + + let current = self.current; + let combined = if self.bit_offset == 0 { + // fast case where there is no offset. In this case, there is bit-alignment + // at byte boundary and thus the bytes correspond exactly. + if self.remaining >= 2 { + self.load_next(); + } + current + } else { + let next = if self.remaining >= 2 { + // case where `next` is complete and thus we can take it all + self.load_next(); + self.current + } else { + // case where the `next` is incomplete and thus we take the remaining + self.last_chunk + }; + merge_reversed(current, next, self.bit_offset) + }; + + self.remaining -= 1; + Some(combined) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + // it contains always one more than the chunk_iterator, which is the last + // one where the remainder is merged into current. + (self.remaining, Some(self.remaining)) + } +} + +impl BitChunkIterExact for BitChunks<'_, T> { + #[inline] + fn remainder(&self) -> T { + self.remainder() + } + + #[inline] + fn remainder_len(&self) -> usize { + self.remainder_len() + } +} + +impl ExactSizeIterator for BitChunks<'_, T> { + #[inline] + fn len(&self) -> usize { + self.chunk_iterator.len() + } +} + +unsafe impl TrustedLen for BitChunks<'_, T> {} diff --git a/crates/nano-arrow/src/bitmap/utils/chunks_exact_mut.rs b/crates/nano-arrow/src/bitmap/utils/chunks_exact_mut.rs new file mode 100644 index 000000000000..7a5a91a12805 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/chunks_exact_mut.rs @@ -0,0 +1,63 @@ +use super::BitChunk; + +/// An iterator over mutable slices of bytes of exact size. +/// +/// # Safety +/// The slices returned by this iterator are guaranteed to have length equal to +/// `std::mem::size_of::()`. +#[derive(Debug)] +pub struct BitChunksExactMut<'a, T: BitChunk> { + chunks: std::slice::ChunksExactMut<'a, u8>, + remainder: &'a mut [u8], + remainder_len: usize, + marker: std::marker::PhantomData, +} + +impl<'a, T: BitChunk> BitChunksExactMut<'a, T> { + /// Returns a new [`BitChunksExactMut`] + #[inline] + pub fn new(bitmap: &'a mut [u8], length: usize) -> Self { + assert!(length <= bitmap.len() * 8); + let size_of = std::mem::size_of::(); + + let bitmap = &mut bitmap[..length.saturating_add(7) / 8]; + + let split = (length / 8 / size_of) * size_of; + let (chunks, remainder) = bitmap.split_at_mut(split); + let remainder_len = length - chunks.len() * 8; + + let chunks = chunks.chunks_exact_mut(size_of); + Self { + chunks, + remainder, + remainder_len, + marker: std::marker::PhantomData, + } + } + + /// The remainder slice + #[inline] + pub fn remainder(&mut self) -> &mut [u8] { + self.remainder + } + + /// The length of the remainder slice in bits. 
+ #[inline] + pub fn remainder_len(&mut self) -> usize { + self.remainder_len + } +} + +impl<'a, T: BitChunk> Iterator for BitChunksExactMut<'a, T> { + type Item = &'a mut [u8]; + + #[inline] + fn next(&mut self) -> Option { + self.chunks.next() + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + self.chunks.size_hint() + } +} diff --git a/crates/nano-arrow/src/bitmap/utils/fmt.rs b/crates/nano-arrow/src/bitmap/utils/fmt.rs new file mode 100644 index 000000000000..45fe9ec9ced3 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/fmt.rs @@ -0,0 +1,72 @@ +use std::fmt::Write; + +use super::is_set; + +/// Formats `bytes` taking into account an offset and length of the form +pub fn fmt( + bytes: &[u8], + offset: usize, + length: usize, + f: &mut std::fmt::Formatter<'_>, +) -> std::fmt::Result { + assert!(offset < 8); + + f.write_char('[')?; + let mut remaining = length; + if remaining == 0 { + f.write_char(']')?; + return Ok(()); + } + + let first = bytes[0]; + let bytes = &bytes[1..]; + let empty_before = 8usize.saturating_sub(remaining + offset); + f.write_str("0b")?; + for _ in 0..empty_before { + f.write_char('_')?; + } + let until = std::cmp::min(8, offset + remaining); + for i in offset..until { + if is_set(first, offset + until - 1 - i) { + f.write_char('1')?; + } else { + f.write_char('0')?; + } + } + for _ in 0..offset { + f.write_char('_')?; + } + remaining -= until - offset; + + if remaining == 0 { + f.write_char(']')?; + return Ok(()); + } + + let number_of_bytes = remaining / 8; + for byte in &bytes[..number_of_bytes] { + f.write_str(", ")?; + f.write_fmt(format_args!("{byte:#010b}"))?; + } + remaining -= number_of_bytes * 8; + if remaining == 0 { + f.write_char(']')?; + return Ok(()); + } + + let last = bytes[std::cmp::min((length + offset + 7) / 8, bytes.len() - 1)]; + let remaining = (length + offset) % 8; + f.write_str(", ")?; + f.write_str("0b")?; + for _ in 0..(8 - remaining) { + f.write_char('_')?; + } + for i in 0..remaining { + if is_set(last, remaining - 1 - i) { + f.write_char('1')?; + } else { + f.write_char('0')?; + } + } + f.write_char(']') +} diff --git a/crates/nano-arrow/src/bitmap/utils/iterator.rs b/crates/nano-arrow/src/bitmap/utils/iterator.rs new file mode 100644 index 000000000000..1a35ad56b562 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/iterator.rs @@ -0,0 +1,82 @@ +use super::get_bit_unchecked; +use crate::trusted_len::TrustedLen; + +/// An iterator over bits according to the [LSB](https://en.wikipedia.org/wiki/Bit_numbering#Least_significant_bit), +/// i.e. the bytes `[4u8, 128u8]` correspond to `[false, false, true, false, ..., true]`. +#[derive(Debug, Clone)] +pub struct BitmapIter<'a> { + bytes: &'a [u8], + index: usize, + end: usize, +} + +impl<'a> BitmapIter<'a> { + /// Creates a new [`BitmapIter`]. 
+ pub fn new(slice: &'a [u8], offset: usize, len: usize) -> Self { + // example: + // slice.len() = 4 + // offset = 9 + // len = 23 + // result: + let bytes = &slice[offset / 8..]; + // bytes.len() = 3 + let index = offset % 8; + // index = 9 % 8 = 1 + let end = len + index; + // end = 23 + 1 = 24 + assert!(end <= bytes.len() * 8); + // maximum read before UB in bits: bytes.len() * 8 = 24 + // the first read from the end is `end - 1`, thus, end = 24 is ok + + Self { bytes, index, end } + } +} + +impl<'a> Iterator for BitmapIter<'a> { + type Item = bool; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + // See comment in `new` + Some(unsafe { get_bit_unchecked(self.bytes, old) }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + let exact = self.end - self.index; + (exact, Some(exact)) + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + let new_index = self.index + n; + if new_index > self.end { + self.index = self.end; + None + } else { + self.index = new_index; + self.next() + } + } +} + +impl<'a> DoubleEndedIterator for BitmapIter<'a> { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + // See comment in `new`; end was first decreased + Some(unsafe { get_bit_unchecked(self.bytes, self.end) }) + } + } +} + +unsafe impl TrustedLen for BitmapIter<'_> {} +impl ExactSizeIterator for BitmapIter<'_> {} diff --git a/crates/nano-arrow/src/bitmap/utils/mod.rs b/crates/nano-arrow/src/bitmap/utils/mod.rs new file mode 100644 index 000000000000..b064ffd8bed7 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/mod.rs @@ -0,0 +1,143 @@ +//! General utilities for bitmaps representing items where LSB is the first item. 
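`BitmapIter` is the scalar, offset-aware bit iterator, and it also supports iteration from the back. A sketch over a single byte:

```rust
use nano_arrow::bitmap::utils::BitmapIter;

// iterate 5 bits starting at bit 1 of 0b0001_0110 (LSB-first)
let bits: Vec<bool> = BitmapIter::new(&[0b0001_0110u8], 1, 5).collect();
assert_eq!(bits, vec![true, true, false, true, false]);

// `DoubleEndedIterator` allows walking from the back
let last = BitmapIter::new(&[0b0001_0110u8], 1, 5).next_back();
assert_eq!(last, Some(false));
```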
+mod chunk_iterator; +mod chunks_exact_mut; +mod fmt; +mod iterator; +mod slice_iterator; +mod zip_validity; + +use std::convert::TryInto; + +pub(crate) use chunk_iterator::merge_reversed; +pub use chunk_iterator::{BitChunk, BitChunkIterExact, BitChunks, BitChunksExact}; +pub use chunks_exact_mut::BitChunksExactMut; +pub use fmt::fmt; +pub use iterator::BitmapIter; +pub use slice_iterator::SlicesIterator; +pub use zip_validity::{ZipValidity, ZipValidityIter}; + +const BIT_MASK: [u8; 8] = [1, 2, 4, 8, 16, 32, 64, 128]; +const UNSET_BIT_MASK: [u8; 8] = [ + 255 - 1, + 255 - 2, + 255 - 4, + 255 - 8, + 255 - 16, + 255 - 32, + 255 - 64, + 255 - 128, +]; + +/// Returns whether bit at position `i` in `byte` is set or not +#[inline] +pub fn is_set(byte: u8, i: usize) -> bool { + (byte & BIT_MASK[i]) != 0 +} + +/// Sets bit at position `i` in `byte` +#[inline] +pub fn set(byte: u8, i: usize, value: bool) -> u8 { + if value { + byte | BIT_MASK[i] + } else { + byte & UNSET_BIT_MASK[i] + } +} + +/// Sets bit at position `i` in `data` +/// # Panics +/// panics if `i >= data.len() / 8` +#[inline] +pub fn set_bit(data: &mut [u8], i: usize, value: bool) { + data[i / 8] = set(data[i / 8], i % 8, value); +} + +/// Sets bit at position `i` in `data` without doing bound checks +/// # Safety +/// caller must ensure that `i < data.len() / 8` +#[inline] +pub unsafe fn set_bit_unchecked(data: &mut [u8], i: usize, value: bool) { + let byte = data.get_unchecked_mut(i / 8); + *byte = set(*byte, i % 8, value); +} + +/// Returns whether bit at position `i` in `data` is set +/// # Panic +/// This function panics iff `i / 8 >= bytes.len()` +#[inline] +pub fn get_bit(bytes: &[u8], i: usize) -> bool { + is_set(bytes[i / 8], i % 8) +} + +/// Returns whether bit at position `i` in `data` is set or not. +/// +/// # Safety +/// `i >= data.len() * 8` results in undefined behavior +#[inline] +pub unsafe fn get_bit_unchecked(data: &[u8], i: usize) -> bool { + (*data.as_ptr().add(i >> 3) & BIT_MASK[i & 7]) != 0 +} + +/// Returns the number of bytes required to hold `bits` bits. +#[inline] +pub fn bytes_for(bits: usize) -> usize { + bits.saturating_add(7) / 8 +} + +/// Returns the number of zero bits in the slice offsetted by `offset` and a length of `length`. +/// # Panics +/// This function panics iff `(offset + len).saturating_add(7) / 8 >= slice.len()` +/// because it corresponds to the situation where `len` is beyond bounds. +pub fn count_zeros(slice: &[u8], offset: usize, len: usize) -> usize { + if len == 0 { + return 0; + }; + + let mut slice = &slice[offset / 8..(offset + len).saturating_add(7) / 8]; + let offset = offset % 8; + + if (offset + len) / 8 == 0 { + // all within a single byte + let byte = (slice[0] >> offset) << (8 - len); + return len - byte.count_ones() as usize; + } + + // slice: [a1,a2,a3,a4], [a5,a6,a7,a8] + // offset: 3 + // len: 4 + // [__,__,__,a4], [a5,a6,a7,__] + let mut set_count = 0; + if offset != 0 { + // count all ignoring the first `offset` bits + // i.e. [__,__,__,a4] + set_count += (slice[0] >> offset).count_ones() as usize; + slice = &slice[1..]; + } + if (offset + len) % 8 != 0 { + let end_offset = (offset + len) % 8; // i.e. 3 + 4 = 7 + let last_index = slice.len() - 1; + // count all ignoring the last `offset` bits + // i.e. 
[a5,a6,a7,__] + set_count += (slice[last_index] << (8 - end_offset)).count_ones() as usize; + slice = &slice[..last_index]; + } + + // finally, count any and all bytes in the middle in groups of 8 + let mut chunks = slice.chunks_exact(8); + set_count += chunks + .by_ref() + .map(|chunk| { + let a = u64::from_ne_bytes(chunk.try_into().unwrap()); + a.count_ones() as usize + }) + .sum::(); + + // and any bytes that do not fit in the group + set_count += chunks + .remainder() + .iter() + .map(|byte| byte.count_ones() as usize) + .sum::(); + + len - set_count +} diff --git a/crates/nano-arrow/src/bitmap/utils/slice_iterator.rs b/crates/nano-arrow/src/bitmap/utils/slice_iterator.rs new file mode 100644 index 000000000000..dc388f1d41b5 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/slice_iterator.rs @@ -0,0 +1,145 @@ +use crate::bitmap::Bitmap; + +/// Internal state of [`SlicesIterator`] +#[derive(Debug, Clone, PartialEq)] +enum State { + // normal iteration + Nominal, + // nothing more to iterate. + Finished, +} + +/// Iterator over a bitmap that returns slices of set regions +/// This is the most efficient method to extract slices of values from arrays +/// with a validity bitmap. +/// For example, the bitmap `00101111` returns `[(0,4), (6,1)]` +#[derive(Debug, Clone)] +pub struct SlicesIterator<'a> { + values: std::slice::Iter<'a, u8>, + count: usize, + mask: u8, + max_len: usize, + current_byte: &'a u8, + state: State, + len: usize, + start: usize, + on_region: bool, +} + +impl<'a> SlicesIterator<'a> { + /// Creates a new [`SlicesIterator`] + pub fn new(values: &'a Bitmap) -> Self { + let (buffer, offset, _) = values.as_slice(); + let mut iter = buffer.iter(); + + let (current_byte, state) = match iter.next() { + Some(b) => (b, State::Nominal), + None => (&0, State::Finished), + }; + + Self { + state, + count: values.len() - values.unset_bits(), + max_len: values.len(), + values: iter, + mask: 1u8.rotate_left(offset as u32), + current_byte, + len: 0, + start: 0, + on_region: false, + } + } + + #[inline] + fn finish(&mut self) -> Option<(usize, usize)> { + self.state = State::Finished; + if self.on_region { + Some((self.start, self.len)) + } else { + None + } + } + + #[inline] + fn current_len(&self) -> usize { + self.start + self.len + } + + /// Returns the total number of slots. + /// It corresponds to the sum of all lengths of all slices. 
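The free functions above (`set_bit`, `get_bit`, `bytes_for`, `count_zeros`) operate on raw byte slices and are the primitives the containers in this module build on. A sketch:

```rust
use nano_arrow::bitmap::utils::{bytes_for, count_zeros, get_bit, set_bit};

// 10 bits need 2 bytes
let mut data = vec![0u8; bytes_for(10)];
set_bit(&mut data, 0, true);
set_bit(&mut data, 9, true);

assert!(get_bit(&data, 9));
assert!(!get_bit(&data, 1));
// 10 bits in total, 2 of them set
assert_eq!(count_zeros(&data, 0, 10), 8);
```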
+ #[inline] + pub fn slots(&self) -> usize { + self.count + } +} + +impl<'a> Iterator for SlicesIterator<'a> { + type Item = (usize, usize); + + #[inline] + fn next(&mut self) -> Option { + loop { + if self.state == State::Finished { + return None; + } + if self.current_len() == self.max_len { + return self.finish(); + } + + if self.mask == 1 { + // at the beginning of a byte => try to skip it all together + match (self.on_region, self.current_byte) { + (true, &255u8) => { + self.len = std::cmp::min(self.max_len - self.start, self.len + 8); + if let Some(v) = self.values.next() { + self.current_byte = v; + }; + continue; + }, + (false, &0) => { + self.len = std::cmp::min(self.max_len - self.start, self.len + 8); + if let Some(v) = self.values.next() { + self.current_byte = v; + }; + continue; + }, + _ => (), // we need to run over all bits of this byte + } + }; + + let value = (self.current_byte & self.mask) != 0; + self.mask = self.mask.rotate_left(1); + + match (self.on_region, value) { + (true, true) => self.len += 1, + (false, false) => self.len += 1, + (true, false) => { + self.on_region = false; + let result = (self.start, self.len); + self.start += self.len; + self.len = 1; + if self.mask == 1 { + // reached a new byte => try to fetch it from the iterator + if let Some(v) = self.values.next() { + self.current_byte = v; + }; + } + return Some(result); + }, + (false, true) => { + self.start += self.len; + self.len = 1; + self.on_region = true; + }, + } + + if self.mask == 1 { + // reached a new byte => try to fetch it from the iterator + match self.values.next() { + Some(v) => self.current_byte = v, + None => return self.finish(), + }; + } + } + } +} diff --git a/crates/nano-arrow/src/bitmap/utils/zip_validity.rs b/crates/nano-arrow/src/bitmap/utils/zip_validity.rs new file mode 100644 index 000000000000..40965bab4113 --- /dev/null +++ b/crates/nano-arrow/src/bitmap/utils/zip_validity.rs @@ -0,0 +1,216 @@ +use crate::bitmap::utils::BitmapIter; +use crate::bitmap::Bitmap; +use crate::trusted_len::TrustedLen; + +/// An [`Iterator`] over validity and values. +#[derive(Debug, Clone)] +pub struct ZipValidityIter +where + I: Iterator, + V: Iterator, +{ + values: I, + validity: V, +} + +impl ZipValidityIter +where + I: Iterator, + V: Iterator, +{ + /// Creates a new [`ZipValidityIter`]. 
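`SlicesIterator` converts a validity bitmap into `(offset, length)` runs of consecutive set bits, skipping all-zero and all-one bytes wholesale. A sketch:

```rust
use nano_arrow::bitmap::utils::SlicesIterator;
use nano_arrow::bitmap::Bitmap;

let validity = Bitmap::from([true, true, false, false, true, true, true]);
let iter = SlicesIterator::new(&validity);

assert_eq!(iter.slots(), 5); // total number of set bits
assert_eq!(iter.collect::<Vec<_>>(), vec![(0, 2), (4, 3)]);
```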
+ /// # Panics + /// This function panics if the size_hints of the iterators are different + pub fn new(values: I, validity: V) -> Self { + assert_eq!(values.size_hint(), validity.size_hint()); + Self { values, validity } + } +} + +impl Iterator for ZipValidityIter +where + I: Iterator, + V: Iterator, +{ + type Item = Option; + + #[inline] + fn next(&mut self) -> Option { + let value = self.values.next(); + let is_valid = self.validity.next(); + is_valid + .zip(value) + .map(|(is_valid, value)| is_valid.then(|| value)) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + self.values.size_hint() + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + let value = self.values.nth(n); + let is_valid = self.validity.nth(n); + is_valid + .zip(value) + .map(|(is_valid, value)| is_valid.then(|| value)) + } +} + +impl DoubleEndedIterator for ZipValidityIter +where + I: DoubleEndedIterator, + V: DoubleEndedIterator, +{ + #[inline] + fn next_back(&mut self) -> Option { + let value = self.values.next_back(); + let is_valid = self.validity.next_back(); + is_valid + .zip(value) + .map(|(is_valid, value)| is_valid.then(|| value)) + } +} + +unsafe impl TrustedLen for ZipValidityIter +where + I: TrustedLen, + V: TrustedLen, +{ +} + +impl ExactSizeIterator for ZipValidityIter +where + I: ExactSizeIterator, + V: ExactSizeIterator, +{ +} + +/// An [`Iterator`] over [`Option`] +/// This enum can be used in two distinct ways: +/// * as an iterator, via `Iterator::next` +/// * as an enum of two iterators, via `match self` +/// The latter allows specializalizing to when there are no nulls +#[derive(Debug, Clone)] +pub enum ZipValidity +where + I: Iterator, + V: Iterator, +{ + /// There are no null values + Required(I), + /// There are null values + Optional(ZipValidityIter), +} + +impl ZipValidity +where + I: Iterator, + V: Iterator, +{ + /// Returns a new [`ZipValidity`] + pub fn new(values: I, validity: Option) -> Self { + match validity { + Some(validity) => Self::Optional(ZipValidityIter::new(values, validity)), + _ => Self::Required(values), + } + } +} + +impl<'a, T, I> ZipValidity> +where + I: Iterator, +{ + /// Returns a new [`ZipValidity`] and drops the `validity` if all values + /// are valid. + pub fn new_with_validity(values: I, validity: Option<&'a Bitmap>) -> Self { + // only if the validity has nulls we take the optional branch. 
+ match validity.and_then(|validity| (validity.unset_bits() > 0).then(|| validity.iter())) { + Some(validity) => Self::Optional(ZipValidityIter::new(values, validity)), + _ => Self::Required(values), + } + } +} + +impl Iterator for ZipValidity +where + I: Iterator, + V: Iterator, +{ + type Item = Option; + + #[inline] + fn next(&mut self) -> Option { + match self { + Self::Required(values) => values.next().map(Some), + Self::Optional(zipped) => zipped.next(), + } + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + match self { + Self::Required(values) => values.size_hint(), + Self::Optional(zipped) => zipped.size_hint(), + } + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + match self { + Self::Required(values) => values.nth(n).map(Some), + Self::Optional(zipped) => zipped.nth(n), + } + } +} + +impl DoubleEndedIterator for ZipValidity +where + I: DoubleEndedIterator, + V: DoubleEndedIterator, +{ + #[inline] + fn next_back(&mut self) -> Option { + match self { + Self::Required(values) => values.next_back().map(Some), + Self::Optional(zipped) => zipped.next_back(), + } + } +} + +impl ExactSizeIterator for ZipValidity +where + I: ExactSizeIterator, + V: ExactSizeIterator, +{ +} + +unsafe impl TrustedLen for ZipValidity +where + I: TrustedLen, + V: TrustedLen, +{ +} + +impl ZipValidity +where + I: Iterator, + V: Iterator, +{ + /// Unwrap into an iterator that has no null values. + pub fn unwrap_required(self) -> I { + match self { + ZipValidity::Required(i) => i, + _ => panic!("Could not 'unwrap_required'. 'ZipValidity' iterator has nulls."), + } + } + + /// Unwrap into an iterator that has null values. + pub fn unwrap_optional(self) -> ZipValidityIter { + match self { + ZipValidity::Optional(i) => i, + _ => panic!("Could not 'unwrap_optional'. 'ZipValidity' iterator has no nulls."), + } + } +} diff --git a/crates/nano-arrow/src/buffer/immutable.rs b/crates/nano-arrow/src/buffer/immutable.rs new file mode 100644 index 000000000000..b9b87336b359 --- /dev/null +++ b/crates/nano-arrow/src/buffer/immutable.rs @@ -0,0 +1,328 @@ +use std::iter::FromIterator; +use std::ops::Deref; +use std::sync::Arc; +use std::usize; + +use either::Either; + +use super::{Bytes, IntoIter}; + +/// [`Buffer`] is a contiguous memory region that can be shared across +/// thread boundaries. +/// +/// The easiest way to think about [`Buffer`] is being equivalent to +/// a `Arc>`, with the following differences: +/// * slicing and cloning is `O(1)`. +/// * it supports external allocated memory +/// +/// The easiest way to create one is to use its implementation of `From>`. +/// +/// # Examples +/// ``` +/// use arrow2::buffer::Buffer; +/// +/// let mut buffer: Buffer = vec![1, 2, 3].into(); +/// assert_eq!(buffer.as_ref(), [1, 2, 3].as_ref()); +/// +/// // it supports copy-on-write semantics (i.e. back to a `Vec`) +/// let vec: Vec = buffer.into_mut().right().unwrap(); +/// assert_eq!(vec, vec![1, 2, 3]); +/// +/// // cloning and slicing is `O(1)` (data is shared) +/// let mut buffer: Buffer = vec![1, 2, 3].into(); +/// let mut sliced = buffer.clone(); +/// sliced.slice(1, 1); +/// assert_eq!(sliced.as_ref(), [2].as_ref()); +/// // but cloning forbids getting mut since `slice` and `buffer` now share data +/// assert_eq!(buffer.get_mut_slice(), None); +/// ``` +#[derive(Clone)] +pub struct Buffer { + /// the internal byte buffer. + data: Arc>, + + /// The offset into the buffer. + offset: usize, + + // the length of the buffer. 
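`ZipValidity` pairs a values iterator with an optional validity and yields `Option<T>`, degenerating to the plain values iterator when no nulls are present. A sketch; the `i32` values are arbitrary illustration data:

```rust
use nano_arrow::bitmap::utils::ZipValidity;
use nano_arrow::bitmap::Bitmap;

let values = [1i32, 2, 3];
let validity = Bitmap::from([true, false, true]);

let zipped: Vec<Option<i32>> =
    ZipValidity::new_with_validity(values.iter().copied(), Some(&validity)).collect();
assert_eq!(zipped, vec![Some(1), None, Some(3)]);

// with no validity, every element is yielded as `Some`
let all_valid: Vec<Option<i32>> =
    ZipValidity::new_with_validity(values.iter().copied(), None).collect();
assert_eq!(all_valid, vec![Some(1), Some(2), Some(3)]);
```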
Given a region `data` of N bytes, [offset..offset+length] is visible + // to this buffer. + length: usize, +} + +impl PartialEq for Buffer { + #[inline] + fn eq(&self, other: &Self) -> bool { + self.deref() == other.deref() + } +} + +impl std::fmt::Debug for Buffer { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + std::fmt::Debug::fmt(&**self, f) + } +} + +impl Default for Buffer { + #[inline] + fn default() -> Self { + Vec::new().into() + } +} + +impl Buffer { + /// Creates an empty [`Buffer`]. + #[inline] + pub fn new() -> Self { + Self::default() + } + + /// Auxiliary method to create a new Buffer + pub(crate) fn from_bytes(bytes: Bytes) -> Self { + let length = bytes.len(); + Buffer { + data: Arc::new(bytes), + offset: 0, + length, + } + } + + /// Returns the number of bytes in the buffer + #[inline] + pub fn len(&self) -> usize { + self.length + } + + /// Returns whether the buffer is empty. + #[inline] + pub fn is_empty(&self) -> bool { + self.len() == 0 + } + + /// Returns whether underlying data is sliced. + /// If sliced the [`Buffer`] is backed by + /// more data than the length of `Self`. + pub fn is_sliced(&self) -> bool { + self.data.len() != self.length + } + + /// Returns the byte slice stored in this buffer + #[inline] + pub fn as_slice(&self) -> &[T] { + // Safety: + // invariant of this struct `offset + length <= data.len()` + debug_assert!(self.offset + self.length <= self.data.len()); + unsafe { + self.data + .get_unchecked(self.offset..self.offset + self.length) + } + } + + /// Returns the byte slice stored in this buffer + /// # Safety + /// `index` must be smaller than `len` + #[inline] + pub(super) unsafe fn get_unchecked(&self, index: usize) -> &T { + // Safety: + // invariant of this function + debug_assert!(index < self.length); + unsafe { self.data.get_unchecked(self.offset + index) } + } + + /// Returns a new [`Buffer`] that is a slice of this buffer starting at `offset`. + /// Doing so allows the same memory region to be shared between buffers. + /// # Panics + /// Panics iff `offset + length` is larger than `len`. + #[inline] + pub fn sliced(self, offset: usize, length: usize) -> Self { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + // Safety: we just checked bounds + unsafe { self.sliced_unchecked(offset, length) } + } + + /// Slices this buffer starting at `offset`. + /// # Panics + /// Panics iff `offset` is larger than `len`. + #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!( + offset + length <= self.len(), + "the offset of the new Buffer cannot exceed the existing length" + ); + // Safety: we just checked bounds + unsafe { self.slice_unchecked(offset, length) } + } + + /// Returns a new [`Buffer`] that is a slice of this buffer starting at `offset`. + /// Doing so allows the same memory region to be shared between buffers. + /// # Safety + /// The caller must ensure `offset + length <= self.len()` + #[inline] + #[must_use] + pub unsafe fn sliced_unchecked(mut self, offset: usize, length: usize) -> Self { + self.slice_unchecked(offset, length); + self + } + + /// Slices this buffer starting at `offset`. + /// # Safety + /// The caller must ensure `offset + length <= self.len()` + #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.offset += offset; + self.length = length; + } + + /// Returns a pointer to the start of this buffer. 
+ #[inline] + pub(crate) fn as_ptr(&self) -> *const T { + self.data.deref().as_ptr() + } + + /// Returns the offset of this buffer. + #[inline] + pub fn offset(&self) -> usize { + self.offset + } + + /// # Safety + /// The caller must ensure that the buffer was properly initialized up to `len`. + #[inline] + pub unsafe fn set_len(&mut self, len: usize) { + self.length = len; + } + + /// Returns a mutable reference to its underlying [`Vec`], if possible. + /// + /// This operation returns [`Either::Right`] iff this [`Buffer`]: + /// * has not been cloned (i.e. [`Arc`]`::get_mut` yields [`Some`]) + /// * has not been imported from the c data interface (FFI) + #[inline] + pub fn into_mut(mut self) -> Either> { + match Arc::get_mut(&mut self.data) + .and_then(|b| b.get_vec()) + .map(std::mem::take) + { + Some(inner) => Either::Right(inner), + None => Either::Left(self), + } + } + + /// Returns a mutable reference to its underlying `Vec`, if possible. + /// Note that only `[self.offset(), self.offset() + self.len()[` in this vector is visible + /// by this buffer. + /// + /// This operation returns [`Some`] iff this [`Buffer`]: + /// * has not been cloned (i.e. [`Arc`]`::get_mut` yields [`Some`]) + /// * has not been imported from the c data interface (FFI) + /// # Safety + /// The caller must ensure that the vector in the mutable reference keeps a length of at least `self.offset() + self.len() - 1`. + #[inline] + pub unsafe fn get_mut(&mut self) -> Option<&mut Vec> { + Arc::get_mut(&mut self.data).and_then(|b| b.get_vec()) + } + + /// Returns a mutable reference to its slice, if possible. + /// + /// This operation returns [`Some`] iff this [`Buffer`]: + /// * has not been cloned (i.e. [`Arc`]`::get_mut` yields [`Some`]) + /// * has not been imported from the c data interface (FFI) + #[inline] + pub fn get_mut_slice(&mut self) -> Option<&mut [T]> { + Arc::get_mut(&mut self.data) + .and_then(|b| b.get_vec()) + // Safety: the invariant of this struct + .map(|x| unsafe { x.get_unchecked_mut(self.offset..self.offset + self.length) }) + } + + /// Get the strong count of underlying `Arc` data buffer. + pub fn shared_count_strong(&self) -> usize { + Arc::strong_count(&self.data) + } + + /// Get the weak count of underlying `Arc` data buffer. + pub fn shared_count_weak(&self) -> usize { + Arc::weak_count(&self.data) + } + + /// Returns its internal representation + #[must_use] + pub fn into_inner(self) -> (Arc>, usize, usize) { + let Self { + data, + offset, + length, + } = self; + (data, offset, length) + } + + /// Creates a `[Bitmap]` from its internal representation. + /// This is the inverted from `[Bitmap::into_inner]` + /// + /// # Safety + /// Callers must ensure all invariants of this struct are upheld. 
+ pub unsafe fn from_inner_unchecked(data: Arc>, offset: usize, length: usize) -> Self { + Self { + data, + offset, + length, + } + } +} + +impl From> for Buffer { + #[inline] + fn from(p: Vec) -> Self { + let bytes: Bytes = p.into(); + Self { + offset: 0, + length: bytes.len(), + data: Arc::new(bytes), + } + } +} + +impl std::ops::Deref for Buffer { + type Target = [T]; + + #[inline] + fn deref(&self) -> &[T] { + self.as_slice() + } +} + +impl FromIterator for Buffer { + #[inline] + fn from_iter>(iter: I) -> Self { + Vec::from_iter(iter).into() + } +} + +impl IntoIterator for Buffer { + type Item = T; + + type IntoIter = IntoIter; + + fn into_iter(self) -> Self::IntoIter { + IntoIter::new(self) + } +} + +#[cfg(feature = "arrow")] +impl From for Buffer { + fn from(value: arrow_buffer::Buffer) -> Self { + Self::from_bytes(crate::buffer::to_bytes(value)) + } +} + +#[cfg(feature = "arrow")] +impl From> for arrow_buffer::Buffer { + fn from(value: Buffer) -> Self { + crate::buffer::to_buffer(value.data).slice_with_length( + value.offset * std::mem::size_of::(), + value.length * std::mem::size_of::(), + ) + } +} diff --git a/crates/nano-arrow/src/buffer/iterator.rs b/crates/nano-arrow/src/buffer/iterator.rs new file mode 100644 index 000000000000..93511c480284 --- /dev/null +++ b/crates/nano-arrow/src/buffer/iterator.rs @@ -0,0 +1,68 @@ +use super::Buffer; +use crate::trusted_len::TrustedLen; + +/// This crates' equivalent of [`std::vec::IntoIter`] for [`Buffer`]. +#[derive(Debug, Clone)] +pub struct IntoIter { + values: Buffer, + index: usize, + end: usize, +} + +impl IntoIter { + /// Creates a new [`Buffer`] + #[inline] + pub fn new(values: Buffer) -> Self { + let end = values.len(); + Self { + values, + index: 0, + end, + } + } +} + +impl Iterator for IntoIter { + type Item = T; + + #[inline] + fn next(&mut self) -> Option { + if self.index == self.end { + return None; + } + let old = self.index; + self.index += 1; + Some(*unsafe { self.values.get_unchecked(old) }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.end - self.index, Some(self.end - self.index)) + } + + #[inline] + fn nth(&mut self, n: usize) -> Option { + let new_index = self.index + n; + if new_index > self.end { + self.index = self.end; + None + } else { + self.index = new_index; + self.next() + } + } +} + +impl DoubleEndedIterator for IntoIter { + #[inline] + fn next_back(&mut self) -> Option { + if self.index == self.end { + None + } else { + self.end -= 1; + Some(*unsafe { self.values.get_unchecked(self.end) }) + } + } +} + +unsafe impl TrustedLen for IntoIter {} diff --git a/crates/nano-arrow/src/buffer/mod.rs b/crates/nano-arrow/src/buffer/mod.rs new file mode 100644 index 000000000000..b75825d0ada1 --- /dev/null +++ b/crates/nano-arrow/src/buffer/mod.rs @@ -0,0 +1,96 @@ +//! Contains [`Buffer`], an immutable container for all Arrow physical types (e.g. i32, f64). + +mod immutable; +mod iterator; + +use std::ops::Deref; + +use crate::ffi::InternalArrowArray; + +pub(crate) enum BytesAllocator { + InternalArrowArray(InternalArrowArray), + + #[cfg(feature = "arrow")] + Arrow(arrow_buffer::Buffer), +} +pub(crate) type BytesInner = foreign_vec::ForeignVec; + +/// Bytes representation. +#[repr(transparent)] +pub struct Bytes(BytesInner); + +impl Bytes { + /// Takes ownership of an allocated memory region. 
+ /// # Panics + /// This function panics if and only if pointer is not null + /// # Safety + /// This function is safe if and only if `ptr` is valid for `length` + /// # Implementation + /// This function leaks if and only if `owner` does not deallocate + /// the region `[ptr, ptr+length[` when dropped. + #[inline] + pub(crate) unsafe fn from_foreign(ptr: *const T, length: usize, owner: BytesAllocator) -> Self { + Self(BytesInner::from_foreign(ptr, length, owner)) + } + + /// Returns a `Some` mutable reference of [`Vec`] iff this was initialized + /// from a [`Vec`] and `None` otherwise. + #[inline] + pub(crate) fn get_vec(&mut self) -> Option<&mut Vec> { + self.0.get_vec() + } +} + +impl Deref for Bytes { + type Target = [T]; + + #[inline] + fn deref(&self) -> &Self::Target { + &self.0 + } +} + +impl From> for Bytes { + #[inline] + fn from(data: Vec) -> Self { + let inner: BytesInner = data.into(); + Bytes(inner) + } +} + +impl From> for Bytes { + #[inline] + fn from(value: BytesInner) -> Self { + Self(value) + } +} + +#[cfg(feature = "arrow")] +pub(crate) fn to_buffer( + value: std::sync::Arc>, +) -> arrow_buffer::Buffer { + // This should never panic as ForeignVec pointer must be non-null + let ptr = std::ptr::NonNull::new(value.as_ptr() as _).unwrap(); + let len = value.len() * std::mem::size_of::(); + // Safety: allocation is guaranteed to be valid for `len` bytes + unsafe { arrow_buffer::Buffer::from_custom_allocation(ptr, len, value) } +} + +#[cfg(feature = "arrow")] +pub(crate) fn to_bytes(value: arrow_buffer::Buffer) -> Bytes { + let ptr = value.as_ptr(); + let align = ptr.align_offset(std::mem::align_of::()); + assert_eq!(align, 0, "not aligned"); + let len = value.len() / std::mem::size_of::(); + + // Valid as `NativeType: Pod` and checked alignment above + let ptr = value.as_ptr() as *const T; + + let owner = crate::buffer::BytesAllocator::Arrow(value); + + // Safety: slice is valid for len elements of T + unsafe { Bytes::from_foreign(ptr, len, owner) } +} + +pub use immutable::Buffer; +pub(super) use iterator::IntoIter; diff --git a/crates/nano-arrow/src/chunk.rs b/crates/nano-arrow/src/chunk.rs new file mode 100644 index 000000000000..ffc857bcc134 --- /dev/null +++ b/crates/nano-arrow/src/chunk.rs @@ -0,0 +1,84 @@ +//! Contains [`Chunk`], a container of [`Array`] where every array has the +//! same length. + +use crate::array::Array; +use crate::error::{Error, Result}; + +/// A vector of trait objects of [`Array`] where every item has +/// the same length, [`Chunk::len`]. +#[derive(Debug, Clone, PartialEq, Eq)] +pub struct Chunk> { + arrays: Vec, +} + +impl> Chunk { + /// Creates a new [`Chunk`]. + /// # Panic + /// Iff the arrays do not have the same length + pub fn new(arrays: Vec) -> Self { + Self::try_new(arrays).unwrap() + } + + /// Creates a new [`Chunk`]. 
+    /// # Error
+    /// Iff the arrays do not have the same length
+    pub fn try_new(arrays: Vec<A>) -> Result<Self> {
+        if !arrays.is_empty() {
+            let len = arrays.first().unwrap().as_ref().len();
+            if arrays
+                .iter()
+                .map(|array| array.as_ref())
+                .any(|array| array.len() != len)
+            {
+                return Err(Error::InvalidArgumentError(
+                    "Chunk requires all its arrays to have an equal number of rows".to_string(),
+                ));
+            }
+        }
+        Ok(Self { arrays })
+    }
+
+    /// returns the [`Array`]s in [`Chunk`]
+    pub fn arrays(&self) -> &[A] {
+        &self.arrays
+    }
+
+    /// returns the [`Array`]s in [`Chunk`]
+    pub fn columns(&self) -> &[A] {
+        &self.arrays
+    }
+
+    /// returns the number of rows of every array
+    pub fn len(&self) -> usize {
+        self.arrays
+            .first()
+            .map(|x| x.as_ref().len())
+            .unwrap_or_default()
+    }
+
+    /// returns whether the chunk is empty (i.e. has no rows)
+    pub fn is_empty(&self) -> bool {
+        self.len() == 0
+    }
+
+    /// Consumes [`Chunk`] into its underlying arrays.
+    /// The arrays are guaranteed to have the same length
+    pub fn into_arrays(self) -> Vec<A> {
+        self.arrays
+    }
+}
+
+impl<A: AsRef<dyn Array>> From<Chunk<A>> for Vec<A> {
+    fn from(c: Chunk<A>) -> Self {
+        c.into_arrays()
+    }
+}
+
+impl<A: AsRef<dyn Array>> std::ops::Deref for Chunk<A> {
+    type Target = [A];
+
+    #[inline]
+    fn deref(&self) -> &[A] {
+        self.arrays()
+    }
+}
diff --git a/crates/nano-arrow/src/compute/README.md b/crates/nano-arrow/src/compute/README.md
new file mode 100644
index 000000000000..6b5bec7e703e
--- /dev/null
+++ b/crates/nano-arrow/src/compute/README.md
@@ -0,0 +1,32 @@
+# Design
+
+This document outlines the design guidelines of this module.
+
+This module is composed of independent operations common in analytics. Below are some of its design principles:
+
+- APIs MUST return an error when either:
+  - The arguments are incorrect
+  - The execution results in a predictable error (e.g. divide by zero)
+
+- APIs MAY error when an operation overflows (e.g. `i32 + i32`)
+
+- kernels MUST NOT have side-effects
+
+- kernels MUST NOT take ownership of any of their arguments (i.e. everything must be a reference).
+
+- APIs SHOULD error when an operation on variable sized containers can overflow the maximum size of `usize`.
+
+- Kernels SHOULD use the arrays' logical type to decide whether kernels
+  can be applied on an array. For example, `Date32 + Date32` is meaningless and SHOULD NOT be implemented.
+
+- Kernels SHOULD be implemented via `clone`, `slice` or the `iterator` API provided by `Buffer`, `Bitmap`, `Vec` or `MutableBitmap`.
+
+- Kernels MUST NOT use any API to read bits other than the ones provided by `Bitmap`.
+
+- Implementations SHOULD aim for auto-vectorization, which is usually accomplished via `from_trusted_len_iter`.
+
+- Implementations MUST feature-gate any implementation that requires external dependencies.
+
+- When a kernel accepts dynamically-typed arrays, it MUST expect them as `&dyn Array`.
+
+- When an API returns `&dyn Array`, it MUST return `Box<dyn Array>`. The rationale is that a `Box` is mutable, while an `Arc` is not. As such, `Box` offers the most flexible API to consumers and the compiler. Users can cast a `Box` into `Arc` via `.into()`.
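To make the compute guidelines above concrete, here is a minimal, hypothetical sketch of a kernel written against the module layout introduced in this diff. The function name `increment` is illustrative only and is not part of the nano-arrow sources; it borrows its input as `&dyn Array`, has no side-effects, returns `Box<dyn Array>`, and reports unsupported types through an `Error` instead of panicking, delegating the typed work to the `unary` helper from `compute::arity` in the same way the arithmetic kernels later in this diff do.

```rust
// Hypothetical sketch, not part of this diff: illustrates the compute design guidelines.
use crate::array::{Array, PrimitiveArray};
use crate::compute::arity::unary;
use crate::datatypes::{DataType, PhysicalType, PrimitiveType};
use crate::error::{Error, Result};

/// Adds 1 (wrapping) to every non-null value of an `Int32` array.
/// Borrows `&dyn Array`, has no side-effects, and errors instead of panicking.
pub fn increment(array: &dyn Array) -> Result<Box<dyn Array>> {
    match array.data_type().to_physical_type() {
        PhysicalType::Primitive(PrimitiveType::Int32) => {
            // Dynamically-typed input is downcast to its concrete array type.
            let array = array
                .as_any()
                .downcast_ref::<PrimitiveArray<i32>>()
                .unwrap();
            // `unary` maps the values and clones the validity bitmap, keeping the
            // loop simple enough for auto-vectorization.
            let result = unary(array, |v: i32| v.wrapping_add(1), DataType::Int32);
            Ok(Box::new(result))
        },
        _ => Err(Error::InvalidArgumentError(format!(
            "`increment` does not support type `{:?}`",
            array.data_type(),
        ))),
    }
}
```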
diff --git a/crates/nano-arrow/src/compute/aggregate/memory.rs b/crates/nano-arrow/src/compute/aggregate/memory.rs new file mode 100644 index 000000000000..3af974a79b14 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/memory.rs @@ -0,0 +1,118 @@ +use crate::array::*; +use crate::bitmap::Bitmap; +use crate::datatypes::PhysicalType; + +fn validity_size(validity: Option<&Bitmap>) -> usize { + validity.as_ref().map(|b| b.as_slice().0.len()).unwrap_or(0) +} + +macro_rules! dyn_binary { + ($array:expr, $ty:ty, $o:ty) => {{ + let array = $array.as_any().downcast_ref::<$ty>().unwrap(); + let offsets = array.offsets().buffer(); + + // in case of Binary/Utf8/List the offsets are sliced, + // not the values buffer + let values_start = offsets[0] as usize; + let values_end = offsets[offsets.len() - 1] as usize; + + values_end - values_start + + offsets.len() * std::mem::size_of::<$o>() + + validity_size(array.validity()) + }}; +} + +/// Returns the total (heap) allocated size of the array in bytes. +/// # Implementation +/// This estimation is the sum of the size of its buffers, validity, including nested arrays. +/// Multiple arrays may share buffers and bitmaps. Therefore, the size of 2 arrays is not the +/// sum of the sizes computed from this function. In particular, [`StructArray`]'s size is an upper bound. +/// +/// When an array is sliced, its allocated size remains constant because the buffer unchanged. +/// However, this function will yield a smaller number. This is because this function returns +/// the visible size of the buffer, not its total capacity. +/// +/// FFI buffers are included in this estimation. +pub fn estimated_bytes_size(array: &dyn Array) -> usize { + use PhysicalType::*; + match array.data_type().to_physical_type() { + Null => 0, + Boolean => { + let array = array.as_any().downcast_ref::().unwrap(); + array.values().as_slice().0.len() + validity_size(array.validity()) + }, + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + + array.values().len() * std::mem::size_of::<$T>() + validity_size(array.validity()) + }), + Binary => dyn_binary!(array, BinaryArray, i32), + FixedSizeBinary => { + let array = array + .as_any() + .downcast_ref::() + .unwrap(); + array.values().len() + validity_size(array.validity()) + }, + LargeBinary => dyn_binary!(array, BinaryArray, i64), + Utf8 => dyn_binary!(array, Utf8Array, i32), + LargeUtf8 => dyn_binary!(array, Utf8Array, i64), + List => { + let array = array.as_any().downcast_ref::>().unwrap(); + estimated_bytes_size(array.values().as_ref()) + + array.offsets().len_proxy() * std::mem::size_of::() + + validity_size(array.validity()) + }, + FixedSizeList => { + let array = array.as_any().downcast_ref::().unwrap(); + estimated_bytes_size(array.values().as_ref()) + validity_size(array.validity()) + }, + LargeList => { + let array = array.as_any().downcast_ref::>().unwrap(); + estimated_bytes_size(array.values().as_ref()) + + array.offsets().len_proxy() * std::mem::size_of::() + + validity_size(array.validity()) + }, + Struct => { + let array = array.as_any().downcast_ref::().unwrap(); + array + .values() + .iter() + .map(|x| x.as_ref()) + .map(estimated_bytes_size) + .sum::() + + validity_size(array.validity()) + }, + Union => { + let array = array.as_any().downcast_ref::().unwrap(); + let types = array.types().len() * std::mem::size_of::(); + let offsets = array + .offsets() + .as_ref() + .map(|x| x.len() * std::mem::size_of::()) + 
.unwrap_or_default(); + let fields = array + .fields() + .iter() + .map(|x| x.as_ref()) + .map(estimated_bytes_size) + .sum::(); + types + offsets + fields + }, + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + estimated_bytes_size(array.keys()) + estimated_bytes_size(array.values().as_ref()) + }), + Map => { + let array = array.as_any().downcast_ref::().unwrap(); + let offsets = array.offsets().len_proxy() * std::mem::size_of::(); + offsets + estimated_bytes_size(array.field().as_ref()) + validity_size(array.validity()) + }, + } +} diff --git a/crates/nano-arrow/src/compute/aggregate/min_max.rs b/crates/nano-arrow/src/compute/aggregate/min_max.rs new file mode 100644 index 000000000000..e733c6657ccd --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/min_max.rs @@ -0,0 +1,416 @@ +#![allow(clippy::redundant_closure_call)] +use multiversion::multiversion; + +use crate::array::{Array, BinaryArray, BooleanArray, PrimitiveArray, Utf8Array}; +use crate::bitmap::utils::{BitChunkIterExact, BitChunksExact}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, PhysicalType, PrimitiveType}; +use crate::error::{Error, Result}; +use crate::offset::Offset; +use crate::scalar::*; +use crate::types::simd::*; +use crate::types::NativeType; + +/// Trait describing a type describing multiple lanes with an order relationship +/// consistent with the same order of `T`. +pub trait SimdOrd { + /// The minimum value + const MIN: T; + /// The maximum value + const MAX: T; + /// reduce itself to the minimum + fn max_element(self) -> T; + /// reduce itself to the maximum + fn min_element(self) -> T; + /// lane-wise maximum between two instances + fn max_lane(self, x: Self) -> Self; + /// lane-wise minimum between two instances + fn min_lane(self, x: Self) -> Self; + /// returns a new instance with all lanes equal to `MIN` + fn new_min() -> Self; + /// returns a new instance with all lanes equal to `MAX` + fn new_max() -> Self; +} + +#[multiversion(targets = "simd")] +fn nonnull_min_primitive(values: &[T]) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let chunks = values.chunks_exact(T::Simd::LANES); + let remainder = chunks.remainder(); + + let chunk_reduced = chunks.fold(T::Simd::new_min(), |acc, chunk| { + let chunk = T::Simd::from_chunk(chunk); + acc.min_lane(chunk) + }); + + let remainder = T::Simd::from_incomplete_chunk(remainder, T::Simd::MAX); + let reduced = chunk_reduced.min_lane(remainder); + + reduced.min_element() +} + +#[multiversion(targets = "simd")] +fn null_min_primitive_impl(values: &[T], mut validity_masks: I) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, + I: BitChunkIterExact<<::Simd as NativeSimd>::Chunk>, +{ + let mut chunks = values.chunks_exact(T::Simd::LANES); + + let chunk_reduced = chunks.by_ref().zip(validity_masks.by_ref()).fold( + T::Simd::new_min(), + |acc, (chunk, validity_chunk)| { + let chunk = T::Simd::from_chunk(chunk); + let mask = ::Mask::from_chunk(validity_chunk); + let chunk = chunk.select(mask, T::Simd::new_min()); + acc.min_lane(chunk) + }, + ); + + let remainder = T::Simd::from_incomplete_chunk(chunks.remainder(), T::Simd::MAX); + let mask = ::Mask::from_chunk(validity_masks.remainder()); + let remainder = remainder.select(mask, T::Simd::new_min()); + let reduced = chunk_reduced.min_lane(remainder); + + reduced.min_element() +} + +/// # Panics +/// iff `values.len() != bitmap.len()` or the operation overflows. 
+fn null_min_primitive(values: &[T], bitmap: &Bitmap) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let (slice, offset, length) = bitmap.as_slice(); + if offset == 0 { + let validity_masks = BitChunksExact::<::Chunk>::new(slice, length); + null_min_primitive_impl(values, validity_masks) + } else { + let validity_masks = bitmap.chunks::<::Chunk>(); + null_min_primitive_impl(values, validity_masks) + } +} + +/// # Panics +/// iff `values.len() != bitmap.len()` or the operation overflows. +fn null_max_primitive(values: &[T], bitmap: &Bitmap) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let (slice, offset, length) = bitmap.as_slice(); + if offset == 0 { + let validity_masks = BitChunksExact::<::Chunk>::new(slice, length); + null_max_primitive_impl(values, validity_masks) + } else { + let validity_masks = bitmap.chunks::<::Chunk>(); + null_max_primitive_impl(values, validity_masks) + } +} + +#[multiversion(targets = "simd")] +fn nonnull_max_primitive(values: &[T]) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let chunks = values.chunks_exact(T::Simd::LANES); + let remainder = chunks.remainder(); + + let chunk_reduced = chunks.fold(T::Simd::new_max(), |acc, chunk| { + let chunk = T::Simd::from_chunk(chunk); + acc.max_lane(chunk) + }); + + let remainder = T::Simd::from_incomplete_chunk(remainder, T::Simd::MIN); + let reduced = chunk_reduced.max_lane(remainder); + + reduced.max_element() +} + +#[multiversion(targets = "simd")] +fn null_max_primitive_impl(values: &[T], mut validity_masks: I) -> T +where + T: NativeType + Simd, + T::Simd: SimdOrd, + I: BitChunkIterExact<<::Simd as NativeSimd>::Chunk>, +{ + let mut chunks = values.chunks_exact(T::Simd::LANES); + + let chunk_reduced = chunks.by_ref().zip(validity_masks.by_ref()).fold( + T::Simd::new_max(), + |acc, (chunk, validity_chunk)| { + let chunk = T::Simd::from_chunk(chunk); + let mask = ::Mask::from_chunk(validity_chunk); + let chunk = chunk.select(mask, T::Simd::new_max()); + acc.max_lane(chunk) + }, + ); + + let remainder = T::Simd::from_incomplete_chunk(chunks.remainder(), T::Simd::MIN); + let mask = ::Mask::from_chunk(validity_masks.remainder()); + let remainder = remainder.select(mask, T::Simd::new_max()); + let reduced = chunk_reduced.max_lane(remainder); + + reduced.max_element() +} + +/// Returns the minimum value in the array, according to the natural order. +/// For floating point arrays any NaN values are considered to be greater than any other non-null value +pub fn min_primitive(array: &PrimitiveArray) -> Option +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let null_count = array.null_count(); + + // Includes case array.len() == 0 + if null_count == array.len() { + return None; + } + let values = array.values(); + + Some(if let Some(validity) = array.validity() { + null_min_primitive(values, validity) + } else { + nonnull_min_primitive(values) + }) +} + +/// Returns the maximum value in the array, according to the natural order. 
+/// For floating point arrays any NaN values are considered to be greater than any other non-null value +pub fn max_primitive(array: &PrimitiveArray) -> Option +where + T: NativeType + Simd, + T::Simd: SimdOrd, +{ + let null_count = array.null_count(); + + // Includes case array.len() == 0 + if null_count == array.len() { + return None; + } + let values = array.values(); + + Some(if let Some(validity) = array.validity() { + null_max_primitive(values, validity) + } else { + nonnull_max_primitive(values) + }) +} + +/// Helper to compute min/max of [`BinaryArray`] and [`Utf8Array`] +macro_rules! min_max_binary_utf8 { + ($array: expr, $cmp: expr) => { + if $array.null_count() == $array.len() { + None + } else if $array.validity().is_some() { + $array + .iter() + .reduce(|v1, v2| match (v1, v2) { + (None, v2) => v2, + (v1, None) => v1, + (Some(v1), Some(v2)) => { + if $cmp(v1, v2) { + Some(v2) + } else { + Some(v1) + } + }, + }) + .unwrap_or(None) + } else { + $array + .values_iter() + .reduce(|v1, v2| if $cmp(v1, v2) { v2 } else { v1 }) + } + }; +} + +/// Returns the maximum value in the binary array, according to the natural order. +pub fn max_binary(array: &BinaryArray) -> Option<&[u8]> { + min_max_binary_utf8!(array, |a, b| a < b) +} + +/// Returns the minimum value in the binary array, according to the natural order. +pub fn min_binary(array: &BinaryArray) -> Option<&[u8]> { + min_max_binary_utf8!(array, |a, b| a > b) +} + +/// Returns the maximum value in the string array, according to the natural order. +pub fn max_string(array: &Utf8Array) -> Option<&str> { + min_max_binary_utf8!(array, |a, b| a < b) +} + +/// Returns the minimum value in the string array, according to the natural order. +pub fn min_string(array: &Utf8Array) -> Option<&str> { + min_max_binary_utf8!(array, |a, b| a > b) +} + +/// Returns the minimum value in the boolean array. +/// +/// ``` +/// use arrow2::{ +/// array::BooleanArray, +/// compute::aggregate::min_boolean, +/// }; +/// +/// let a = BooleanArray::from(vec![Some(true), None, Some(false)]); +/// assert_eq!(min_boolean(&a), Some(false)) +/// ``` +pub fn min_boolean(array: &BooleanArray) -> Option { + // short circuit if all nulls / zero length array + let null_count = array.null_count(); + if null_count == array.len() { + None + } else if null_count == 0 { + Some(array.values().unset_bits() == 0) + } else { + // Note the min bool is false (0), so short circuit as soon as we see it + array + .iter() + .find(|&b| b == Some(false)) + .flatten() + .or(Some(true)) + } +} + +/// Returns the maximum value in the boolean array +/// +/// ``` +/// use arrow2::{ +/// array::BooleanArray, +/// compute::aggregate::max_boolean, +/// }; +/// +/// let a = BooleanArray::from(vec![Some(true), None, Some(false)]); +/// assert_eq!(max_boolean(&a), Some(true)) +/// ``` +pub fn max_boolean(array: &BooleanArray) -> Option { + // short circuit if all nulls / zero length array + let null_count = array.null_count(); + if null_count == array.len() { + None + } else if null_count == 0 { + Some(array.values().unset_bits() < array.len()) + } else { + // Note the max bool is true (1), so short circuit as soon as we see it + array + .iter() + .find(|&b| b == Some(true)) + .flatten() + .or(Some(false)) + } +} + +macro_rules! dyn_generic { + ($array_ty:ty, $scalar_ty:ty, $array:expr, $f:ident) => {{ + let array = $array.as_any().downcast_ref::<$array_ty>().unwrap(); + Box::new(<$scalar_ty>::new($f(array))) + }}; +} + +macro_rules! 
with_match_primitive_type {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + _ => return Err(Error::InvalidArgumentError(format!( + "`min` and `max` operator do not support primitive `{:?}`", + $key_type, + ))), + } +})} + +/// Returns the maximum of [`Array`]. The scalar is null when all elements are null. +/// # Error +/// Errors iff the type does not support this operation. +pub fn max(array: &dyn Array) -> Result> { + Ok(match array.data_type().to_physical_type() { + PhysicalType::Boolean => dyn_generic!(BooleanArray, BooleanScalar, array, max_boolean), + PhysicalType::Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let data_type = array.data_type().clone(); + let array = array.as_any().downcast_ref().unwrap(); + Box::new(PrimitiveScalar::<$T>::new(data_type, max_primitive::<$T>(array))) + }), + PhysicalType::Utf8 => dyn_generic!(Utf8Array, Utf8Scalar, array, max_string), + PhysicalType::LargeUtf8 => dyn_generic!(Utf8Array, Utf8Scalar, array, max_string), + PhysicalType::Binary => { + dyn_generic!(BinaryArray, BinaryScalar, array, max_binary) + }, + PhysicalType::LargeBinary => { + dyn_generic!(BinaryArray, BinaryScalar, array, min_binary) + }, + _ => { + return Err(Error::InvalidArgumentError(format!( + "The `max` operator does not support type `{:?}`", + array.data_type(), + ))) + }, + }) +} + +/// Returns the minimum of [`Array`]. The scalar is null when all elements are null. +/// # Error +/// Errors iff the type does not support this operation. 
+pub fn min(array: &dyn Array) -> Result> { + Ok(match array.data_type().to_physical_type() { + PhysicalType::Boolean => dyn_generic!(BooleanArray, BooleanScalar, array, min_boolean), + PhysicalType::Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let data_type = array.data_type().clone(); + let array = array.as_any().downcast_ref().unwrap(); + Box::new(PrimitiveScalar::<$T>::new(data_type, min_primitive::<$T>(array))) + }), + PhysicalType::Utf8 => dyn_generic!(Utf8Array, Utf8Scalar, array, min_string), + PhysicalType::LargeUtf8 => dyn_generic!(Utf8Array, Utf8Scalar, array, min_string), + PhysicalType::Binary => { + dyn_generic!(BinaryArray, BinaryScalar, array, min_binary) + }, + PhysicalType::LargeBinary => { + dyn_generic!(BinaryArray, BinaryScalar, array, min_binary) + }, + _ => { + return Err(Error::InvalidArgumentError(format!( + "The `max` operator does not support type `{:?}`", + array.data_type(), + ))) + }, + }) +} + +/// Whether [`min`] supports `data_type` +pub fn can_min(data_type: &DataType) -> bool { + let physical = data_type.to_physical_type(); + if let PhysicalType::Primitive(primitive) = physical { + use PrimitiveType::*; + matches!( + primitive, + Int8 | Int16 | Int64 | Int128 | UInt8 | UInt16 | UInt32 | UInt64 | Float32 | Float64 + ) + } else { + use PhysicalType::*; + matches!(physical, Boolean | Utf8 | LargeUtf8 | Binary | LargeBinary) + } +} + +/// Whether [`max`] supports `data_type` +pub fn can_max(data_type: &DataType) -> bool { + can_min(data_type) +} diff --git a/crates/nano-arrow/src/compute/aggregate/mod.rs b/crates/nano-arrow/src/compute/aggregate/mod.rs new file mode 100644 index 000000000000..b513238f9fd9 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/mod.rs @@ -0,0 +1,15 @@ +//! Contains different aggregation functions +#[cfg(feature = "compute_aggregate")] +mod sum; +#[cfg(feature = "compute_aggregate")] +pub use sum::*; + +#[cfg(feature = "compute_aggregate")] +mod min_max; +#[cfg(feature = "compute_aggregate")] +pub use min_max::*; + +mod memory; +pub use memory::*; +#[cfg(feature = "compute_aggregate")] +mod simd; diff --git a/crates/nano-arrow/src/compute/aggregate/simd/mod.rs b/crates/nano-arrow/src/compute/aggregate/simd/mod.rs new file mode 100644 index 000000000000..25558e9a9e19 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/simd/mod.rs @@ -0,0 +1,109 @@ +use std::ops::Add; + +use super::{SimdOrd, Sum}; +use crate::types::simd::{i128x8, NativeSimd}; + +macro_rules! simd_add { + ($simd:tt, $type:ty, $lanes:expr, $add:tt) => { + impl std::ops::AddAssign for $simd { + #[inline] + fn add_assign(&mut self, rhs: Self) { + for i in 0..$lanes { + self[i] = <$type>::$add(self[i], rhs[i]); + } + } + } + + impl std::ops::Add for $simd { + type Output = Self; + + #[inline] + fn add(self, rhs: Self) -> Self::Output { + let mut result = Self::default(); + for i in 0..$lanes { + result[i] = <$type>::$add(self[i], rhs[i]); + } + result + } + } + + impl Sum<$type> for $simd { + #[inline] + fn simd_sum(self) -> $type { + let mut reduced = <$type>::default(); + (0..<$simd>::LANES).for_each(|i| { + reduced += self[i]; + }); + reduced + } + } + }; +} + +macro_rules! 
simd_ord_int { + ($simd:tt, $type:ty) => { + impl SimdOrd<$type> for $simd { + const MIN: $type = <$type>::MIN; + const MAX: $type = <$type>::MAX; + + #[inline] + fn max_element(self) -> $type { + self.0.iter().copied().fold(Self::MIN, <$type>::max) + } + + #[inline] + fn min_element(self) -> $type { + self.0.iter().copied().fold(Self::MAX, <$type>::min) + } + + #[inline] + fn max_lane(self, x: Self) -> Self { + let mut result = <$simd>::default(); + result + .0 + .iter_mut() + .zip(self.0.iter()) + .zip(x.0.iter()) + .for_each(|((a, b), c)| *a = (*b).max(*c)); + result + } + + #[inline] + fn min_lane(self, x: Self) -> Self { + let mut result = <$simd>::default(); + result + .0 + .iter_mut() + .zip(self.0.iter()) + .zip(x.0.iter()) + .for_each(|((a, b), c)| *a = (*b).min(*c)); + result + } + + #[inline] + fn new_min() -> Self { + Self([Self::MAX; <$simd>::LANES]) + } + + #[inline] + fn new_max() -> Self { + Self([Self::MIN; <$simd>::LANES]) + } + } + }; +} + +pub(super) use {simd_add, simd_ord_int}; + +simd_add!(i128x8, i128, 8, add); +simd_ord_int!(i128x8, i128); + +#[cfg(not(feature = "simd"))] +mod native; +#[cfg(not(feature = "simd"))] +pub use native::*; +#[cfg(feature = "simd")] +mod packed; +#[cfg(feature = "simd")] +#[cfg_attr(docsrs, doc(cfg(feature = "simd")))] +pub use packed::*; diff --git a/crates/nano-arrow/src/compute/aggregate/simd/native.rs b/crates/nano-arrow/src/compute/aggregate/simd/native.rs new file mode 100644 index 000000000000..d6a0275f35e9 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/simd/native.rs @@ -0,0 +1,81 @@ +use std::ops::Add; + +use super::super::min_max::SimdOrd; +use super::super::sum::Sum; +use super::{simd_add, simd_ord_int}; +use crate::types::simd::*; + +simd_add!(u8x64, u8, 64, wrapping_add); +simd_add!(u16x32, u16, 32, wrapping_add); +simd_add!(u32x16, u32, 16, wrapping_add); +simd_add!(u64x8, u64, 8, wrapping_add); +simd_add!(i8x64, i8, 64, wrapping_add); +simd_add!(i16x32, i16, 32, wrapping_add); +simd_add!(i32x16, i32, 16, wrapping_add); +simd_add!(i64x8, i64, 8, wrapping_add); +simd_add!(f32x16, f32, 16, add); +simd_add!(f64x8, f64, 8, add); + +macro_rules! 
simd_ord_float { + ($simd:tt, $type:ty) => { + impl SimdOrd<$type> for $simd { + const MIN: $type = <$type>::NAN; + const MAX: $type = <$type>::NAN; + + #[inline] + fn max_element(self) -> $type { + self.0.iter().copied().fold(Self::MIN, <$type>::max) + } + + #[inline] + fn min_element(self) -> $type { + self.0.iter().copied().fold(Self::MAX, <$type>::min) + } + + #[inline] + fn max_lane(self, x: Self) -> Self { + let mut result = <$simd>::default(); + result + .0 + .iter_mut() + .zip(self.0.iter()) + .zip(x.0.iter()) + .for_each(|((a, b), c)| *a = (*b).max(*c)); + result + } + + #[inline] + fn min_lane(self, x: Self) -> Self { + let mut result = <$simd>::default(); + result + .0 + .iter_mut() + .zip(self.0.iter()) + .zip(x.0.iter()) + .for_each(|((a, b), c)| *a = (*b).min(*c)); + result + } + + #[inline] + fn new_min() -> Self { + Self([Self::MAX; <$simd>::LANES]) + } + + #[inline] + fn new_max() -> Self { + Self([Self::MIN; <$simd>::LANES]) + } + } + }; +} + +simd_ord_int!(u8x64, u8); +simd_ord_int!(u16x32, u16); +simd_ord_int!(u32x16, u32); +simd_ord_int!(u64x8, u64); +simd_ord_int!(i8x64, i8); +simd_ord_int!(i16x32, i16); +simd_ord_int!(i32x16, i32); +simd_ord_int!(i64x8, i64); +simd_ord_float!(f32x16, f32); +simd_ord_float!(f64x8, f64); diff --git a/crates/nano-arrow/src/compute/aggregate/simd/packed.rs b/crates/nano-arrow/src/compute/aggregate/simd/packed.rs new file mode 100644 index 000000000000..40094d31e239 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/simd/packed.rs @@ -0,0 +1,116 @@ +use std::simd::{SimdFloat as _, SimdInt as _, SimdOrd as _, SimdUint as _}; + +use super::super::min_max::SimdOrd; +use super::super::sum::Sum; +use crate::types::simd::*; + +macro_rules! simd_sum { + ($simd:tt, $type:ty, $sum:tt) => { + impl Sum<$type> for $simd { + #[inline] + fn simd_sum(self) -> $type { + self.$sum() + } + } + }; +} + +simd_sum!(f32x16, f32, reduce_sum); +simd_sum!(f64x8, f64, reduce_sum); +simd_sum!(u8x64, u8, reduce_sum); +simd_sum!(u16x32, u16, reduce_sum); +simd_sum!(u32x16, u32, reduce_sum); +simd_sum!(u64x8, u64, reduce_sum); +simd_sum!(i8x64, i8, reduce_sum); +simd_sum!(i16x32, i16, reduce_sum); +simd_sum!(i32x16, i32, reduce_sum); +simd_sum!(i64x8, i64, reduce_sum); + +macro_rules! simd_ord_int { + ($simd:tt, $type:ty) => { + impl SimdOrd<$type> for $simd { + const MIN: $type = <$type>::MIN; + const MAX: $type = <$type>::MAX; + + #[inline] + fn max_element(self) -> $type { + self.reduce_max() + } + + #[inline] + fn min_element(self) -> $type { + self.reduce_min() + } + + #[inline] + fn max_lane(self, x: Self) -> Self { + self.simd_max(x) + } + + #[inline] + fn min_lane(self, x: Self) -> Self { + self.simd_min(x) + } + + #[inline] + fn new_min() -> Self { + Self::splat(Self::MAX) + } + + #[inline] + fn new_max() -> Self { + Self::splat(Self::MIN) + } + } + }; +} + +macro_rules! 
simd_ord_float { + ($simd:tt, $type:ty) => { + impl SimdOrd<$type> for $simd { + const MIN: $type = <$type>::NAN; + const MAX: $type = <$type>::NAN; + + #[inline] + fn max_element(self) -> $type { + self.reduce_max() + } + + #[inline] + fn min_element(self) -> $type { + self.reduce_min() + } + + #[inline] + fn max_lane(self, x: Self) -> Self { + self.simd_max(x) + } + + #[inline] + fn min_lane(self, x: Self) -> Self { + self.simd_min(x) + } + + #[inline] + fn new_min() -> Self { + Self::splat(<$type>::NAN) + } + + #[inline] + fn new_max() -> Self { + Self::splat(<$type>::NAN) + } + } + }; +} + +simd_ord_int!(u8x64, u8); +simd_ord_int!(u16x32, u16); +simd_ord_int!(u32x16, u32); +simd_ord_int!(u64x8, u64); +simd_ord_int!(i8x64, i8); +simd_ord_int!(i16x32, i16); +simd_ord_int!(i32x16, i32); +simd_ord_int!(i64x8, i64); +simd_ord_float!(f32x16, f32); +simd_ord_float!(f64x8, f64); diff --git a/crates/nano-arrow/src/compute/aggregate/sum.rs b/crates/nano-arrow/src/compute/aggregate/sum.rs new file mode 100644 index 000000000000..738440c9f0d2 --- /dev/null +++ b/crates/nano-arrow/src/compute/aggregate/sum.rs @@ -0,0 +1,159 @@ +use std::ops::Add; + +use multiversion::multiversion; + +use crate::array::{Array, PrimitiveArray}; +use crate::bitmap::utils::{BitChunkIterExact, BitChunksExact}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, PhysicalType, PrimitiveType}; +use crate::error::{Error, Result}; +use crate::scalar::*; +use crate::types::simd::*; +use crate::types::NativeType; + +/// Object that can reduce itself to a number. This is used in the context of SIMD to reduce +/// a MD (e.g. `[f32; 16]`) into a single number (`f32`). +pub trait Sum { + /// Reduces this element to a single value. + fn simd_sum(self) -> T; +} + +#[multiversion(targets = "simd")] +/// Compute the sum of a slice +pub fn sum_slice(values: &[T]) -> T +where + T: NativeType + Simd + Add + std::iter::Sum, + T::Simd: Sum + Add, +{ + let (head, simd_vals, tail) = T::Simd::align(values); + + let mut reduced = T::Simd::from_incomplete_chunk(&[], T::default()); + for chunk in simd_vals { + reduced = reduced + *chunk; + } + + reduced.simd_sum() + head.iter().copied().sum() + tail.iter().copied().sum() +} + +/// # Panics +/// iff `values.len() != bitmap.len()` or the operation overflows. +#[multiversion(targets = "simd")] +fn null_sum_impl(values: &[T], mut validity_masks: I) -> T +where + T: NativeType + Simd, + T::Simd: Add + Sum, + I: BitChunkIterExact<<::Simd as NativeSimd>::Chunk>, +{ + let mut chunks = values.chunks_exact(T::Simd::LANES); + + let sum = chunks.by_ref().zip(validity_masks.by_ref()).fold( + T::Simd::default(), + |acc, (chunk, validity_chunk)| { + let chunk = T::Simd::from_chunk(chunk); + let mask = ::Mask::from_chunk(validity_chunk); + let selected = chunk.select(mask, T::Simd::default()); + acc + selected + }, + ); + + let remainder = T::Simd::from_incomplete_chunk(chunks.remainder(), T::default()); + let mask = ::Mask::from_chunk(validity_masks.remainder()); + let remainder = remainder.select(mask, T::Simd::default()); + let reduced = sum + remainder; + + reduced.simd_sum() +} + +/// # Panics +/// iff `values.len() != bitmap.len()` or the operation overflows. 
+fn null_sum(values: &[T], bitmap: &Bitmap) -> T +where + T: NativeType + Simd, + T::Simd: Add + Sum, +{ + let (slice, offset, length) = bitmap.as_slice(); + if offset == 0 { + let validity_masks = BitChunksExact::<::Chunk>::new(slice, length); + null_sum_impl(values, validity_masks) + } else { + let validity_masks = bitmap.chunks::<::Chunk>(); + null_sum_impl(values, validity_masks) + } +} + +/// Returns the sum of values in the array. +/// +/// Returns `None` if the array is empty or only contains null values. +pub fn sum_primitive(array: &PrimitiveArray) -> Option +where + T: NativeType + Simd + Add + std::iter::Sum, + T::Simd: Add + Sum, +{ + let null_count = array.null_count(); + + if null_count == array.len() { + return None; + } + + match array.validity() { + None => Some(sum_slice(array.values())), + Some(bitmap) => Some(null_sum(array.values(), bitmap)), + } +} + +/// Whether [`sum`] supports `data_type` +pub fn can_sum(data_type: &DataType) -> bool { + if let PhysicalType::Primitive(primitive) = data_type.to_physical_type() { + use PrimitiveType::*; + matches!( + primitive, + Int8 | Int16 | Int64 | Int128 | UInt8 | UInt16 | UInt32 | UInt64 | Float32 | Float64 + ) + } else { + false + } +} + +macro_rules! with_match_primitive_type {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + _ => return Err(Error::InvalidArgumentError(format!( + "`sum` operator do not support primitive `{:?}`", + $key_type, + ))), + } +})} + +/// Returns the sum of all elements in `array` as a [`Scalar`] of the same physical +/// and logical types as `array`. +/// # Error +/// Errors iff the operation is not supported. +pub fn sum(array: &dyn Array) -> Result> { + Ok(match array.data_type().to_physical_type() { + PhysicalType::Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let data_type = array.data_type().clone(); + let array = array.as_any().downcast_ref().unwrap(); + Box::new(PrimitiveScalar::new(data_type, sum_primitive::<$T>(array))) + }), + _ => { + return Err(Error::InvalidArgumentError(format!( + "The `sum` operator does not support type `{:?}`", + array.data_type(), + ))) + }, + }) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/add.rs b/crates/nano-arrow/src/compute/arithmetics/basic/add.rs new file mode 100644 index 000000000000..5919b65fdbd5 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/add.rs @@ -0,0 +1,337 @@ +//! Definition of basic add operations with primitive arrays +use std::ops::Add; + +use num_traits::ops::overflowing::OverflowingAdd; +use num_traits::{CheckedAdd, SaturatingAdd, WrappingAdd}; + +use super::NativeArithmetics; +use crate::array::PrimitiveArray; +use crate::bitmap::Bitmap; +use crate::compute::arithmetics::{ + ArrayAdd, ArrayCheckedAdd, ArrayOverflowingAdd, ArraySaturatingAdd, ArrayWrappingAdd, +}; +use crate::compute::arity::{ + binary, binary_checked, binary_with_bitmap, unary, unary_checked, unary_with_bitmap, +}; + +/// Adds two primitive arrays with the same type. 
+/// Panics if the sum of one pair of values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::add; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([None, Some(6), None, Some(6)]); +/// let b = PrimitiveArray::from([Some(5), None, None, Some(6)]); +/// let result = add(&a, &b); +/// let expected = PrimitiveArray::from([None, None, None, Some(12)]); +/// assert_eq!(result, expected) +/// ``` +pub fn add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + Add, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a + b) +} + +/// Wrapping addition of two [`PrimitiveArray`]s. +/// It wraps around at the boundary of the type if the result overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_add; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(-100i8), Some(100i8), Some(100i8)]); +/// let b = PrimitiveArray::from([Some(0i8), Some(100i8), Some(0i8)]); +/// let result = wrapping_add(&a, &b); +/// let expected = PrimitiveArray::from([Some(-100i8), Some(-56i8), Some(100i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + WrappingAdd, +{ + let op = move |a: T, b: T| a.wrapping_add(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked addition of two primitive arrays. If the result from the sum +/// overflows, the validity for that index is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_add; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(100i8), Some(100i8), Some(100i8)]); +/// let b = PrimitiveArray::from([Some(0i8), Some(100i8), Some(0i8)]); +/// let result = checked_add(&a, &b); +/// let expected = PrimitiveArray::from([Some(100i8), None, Some(100i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + CheckedAdd, +{ + let op = move |a: T, b: T| a.checked_add(&b); + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Saturating addition of two primitive arrays. If the result from the sum is +/// larger than the possible number for this type, the result for the operation +/// will be the saturated value. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_add; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(100i8)]); +/// let b = PrimitiveArray::from([Some(100i8)]); +/// let result = saturating_add(&a, &b); +/// let expected = PrimitiveArray::from([Some(127)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingAdd, +{ + let op = move |a: T, b: T| a.saturating_add(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Overflowing addition of two primitive arrays. If the result from the sum is +/// larger than the possible number for this type, the result for the operation +/// will be an array with overflowed values and a validity array indicating +/// the overflowing elements from the array. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_add; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(1i8), Some(100i8)]); +/// let b = PrimitiveArray::from([Some(1i8), Some(100i8)]); +/// let (result, overflow) = overflowing_add(&a, &b); +/// let expected = PrimitiveArray::from([Some(2i8), Some(-56i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_add( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingAdd, +{ + let op = move |a: T, b: T| a.overflowing_add(&b); + + binary_with_bitmap(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayAdd trait for PrimitiveArrays +impl ArrayAdd> for PrimitiveArray +where + T: NativeArithmetics + Add, +{ + fn add(&self, rhs: &PrimitiveArray) -> Self { + add(self, rhs) + } +} + +impl ArrayWrappingAdd> for PrimitiveArray +where + T: NativeArithmetics + WrappingAdd, +{ + fn wrapping_add(&self, rhs: &PrimitiveArray) -> Self { + wrapping_add(self, rhs) + } +} + +// Implementation of ArrayCheckedAdd trait for PrimitiveArrays +impl ArrayCheckedAdd> for PrimitiveArray +where + T: NativeArithmetics + CheckedAdd, +{ + fn checked_add(&self, rhs: &PrimitiveArray) -> Self { + checked_add(self, rhs) + } +} + +// Implementation of ArraySaturatingAdd trait for PrimitiveArrays +impl ArraySaturatingAdd> for PrimitiveArray +where + T: NativeArithmetics + SaturatingAdd, +{ + fn saturating_add(&self, rhs: &PrimitiveArray) -> Self { + saturating_add(self, rhs) + } +} + +// Implementation of ArraySaturatingAdd trait for PrimitiveArrays +impl ArrayOverflowingAdd> for PrimitiveArray +where + T: NativeArithmetics + OverflowingAdd, +{ + fn overflowing_add(&self, rhs: &PrimitiveArray) -> (Self, Bitmap) { + overflowing_add(self, rhs) + } +} + +/// Adds a scalar T to a primitive array of type T. +/// Panics if the sum of the values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::add_scalar; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([None, Some(6), None, Some(6)]); +/// let result = add_scalar(&a, &1i32); +/// let expected = PrimitiveArray::from([None, Some(7), None, Some(7)]); +/// assert_eq!(result, expected) +/// ``` +pub fn add_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + Add, +{ + let rhs = *rhs; + unary(lhs, |a| a + rhs, lhs.data_type().clone()) +} + +/// Wrapping addition of a scalar T to a [`PrimitiveArray`] of type T. +/// It do nothing if the result overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_add_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(100)]); +/// let result = wrapping_add_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[None, Some(-56)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_add_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + WrappingAdd, +{ + unary(lhs, |a| a.wrapping_add(rhs), lhs.data_type().clone()) +} + +/// Checked addition of a scalar T to a primitive array of type T. 
If the +/// result from the sum overflows then the validity index for that value is +/// changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_add_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(100), None, Some(100)]); +/// let result = checked_add_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[None, None, None, None]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_add_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + CheckedAdd, +{ + let rhs = *rhs; + let op = move |a: T| a.checked_add(&rhs); + + unary_checked(lhs, op, lhs.data_type().clone()) +} + +/// Saturated addition of a scalar T to a primitive array of type T. If the +/// result from the sum is larger than the possible number for this type, then +/// the result will be saturated +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_add_scalar; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(100i8)]); +/// let result = saturating_add_scalar(&a, &100i8); +/// let expected = PrimitiveArray::from([Some(127)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_add_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingAdd, +{ + let rhs = *rhs; + let op = move |a: T| a.saturating_add(&rhs); + + unary(lhs, op, lhs.data_type().clone()) +} + +/// Overflowing addition of a scalar T to a primitive array of type T. If the +/// result from the sum is larger than the possible number for this type, then +/// the result will be an array with overflowed values and a validity array +/// indicating the overflowing elements from the array +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_add_scalar; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(1i8), Some(100i8)]); +/// let (result, overflow) = overflowing_add_scalar(&a, &100i8); +/// let expected = PrimitiveArray::from([Some(101i8), Some(-56i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_add_scalar(lhs: &PrimitiveArray, rhs: &T) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingAdd, +{ + let rhs = *rhs; + let op = move |a: T| a.overflowing_add(&rhs); + + unary_with_bitmap(lhs, op, lhs.data_type().clone()) +} + +// Implementation of ArrayAdd trait for PrimitiveArrays with a scalar +impl ArrayAdd for PrimitiveArray +where + T: NativeArithmetics + Add, +{ + fn add(&self, rhs: &T) -> Self { + add_scalar(self, rhs) + } +} + +// Implementation of ArrayCheckedAdd trait for PrimitiveArrays with a scalar +impl ArrayCheckedAdd for PrimitiveArray +where + T: NativeArithmetics + CheckedAdd, +{ + fn checked_add(&self, rhs: &T) -> Self { + checked_add_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingAdd trait for PrimitiveArrays with a scalar +impl ArraySaturatingAdd for PrimitiveArray +where + T: NativeArithmetics + SaturatingAdd, +{ + fn saturating_add(&self, rhs: &T) -> Self { + saturating_add_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingAdd trait for PrimitiveArrays with a scalar +impl ArrayOverflowingAdd for PrimitiveArray +where + T: NativeArithmetics + OverflowingAdd, +{ + fn overflowing_add(&self, rhs: &T) -> (Self, Bitmap) { + overflowing_add_scalar(self, rhs) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/div.rs 
b/crates/nano-arrow/src/compute/arithmetics/basic/div.rs new file mode 100644 index 000000000000..eb8f2ae0ac7c --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/div.rs @@ -0,0 +1,204 @@ +//! Definition of basic div operations with primitive arrays +use std::ops::Div; + +use num_traits::{CheckedDiv, NumCast}; +use strength_reduce::{ + StrengthReducedU16, StrengthReducedU32, StrengthReducedU64, StrengthReducedU8, +}; + +use super::NativeArithmetics; +use crate::array::{Array, PrimitiveArray}; +use crate::compute::arithmetics::{ArrayCheckedDiv, ArrayDiv}; +use crate::compute::arity::{binary, binary_checked, unary, unary_checked}; +use crate::compute::utils::check_same_len; +use crate::datatypes::PrimitiveType; + +/// Divides two primitive arrays with the same type. +/// Panics if the divisor is zero of one pair of values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::div; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[Some(10), Some(1), Some(6)]); +/// let b = Int32Array::from(&[Some(5), None, Some(6)]); +/// let result = div(&a, &b); +/// let expected = Int32Array::from(&[Some(2), None, Some(1)]); +/// assert_eq!(result, expected) +/// ``` +pub fn div(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + Div, +{ + if rhs.null_count() == 0 { + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a / b) + } else { + check_same_len(lhs, rhs).unwrap(); + let values = lhs.iter().zip(rhs.iter()).map(|(l, r)| match (l, r) { + (Some(l), Some(r)) => Some(*l / *r), + _ => None, + }); + + PrimitiveArray::from_trusted_len_iter(values).to(lhs.data_type().clone()) + } +} + +/// Checked division of two primitive arrays. If the result from the division +/// overflows, the result for the operation will change the validity array +/// making this operation None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_div; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8), Some(10i8)]); +/// let b = Int8Array::from(&[Some(100i8), Some(0i8)]); +/// let result = checked_div(&a, &b); +/// let expected = Int8Array::from(&[Some(-1i8), None]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_div(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + CheckedDiv, +{ + let op = move |a: T, b: T| a.checked_div(&b); + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayDiv trait for PrimitiveArrays +impl ArrayDiv> for PrimitiveArray +where + T: NativeArithmetics + Div, +{ + fn div(&self, rhs: &PrimitiveArray) -> Self { + div(self, rhs) + } +} + +// Implementation of ArrayCheckedDiv trait for PrimitiveArrays +impl ArrayCheckedDiv> for PrimitiveArray +where + T: NativeArithmetics + CheckedDiv, +{ + fn checked_div(&self, rhs: &PrimitiveArray) -> Self { + checked_div(self, rhs) + } +} + +/// Divide a primitive array of type T by a scalar T. +/// Panics if the divisor is zero. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::div_scalar; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(6)]); +/// let result = div_scalar(&a, &2i32); +/// let expected = Int32Array::from(&[None, Some(3), None, Some(3)]); +/// assert_eq!(result, expected) +/// ``` +pub fn div_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + Div + NumCast, +{ + let rhs = *rhs; + match T::PRIMITIVE { + PrimitiveType::UInt64 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u64().unwrap(); + + let reduced_div = StrengthReducedU64::new(rhs); + let r = unary(lhs, |a| a / reduced_div, lhs.data_type().clone()); + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt32 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u32().unwrap(); + + let reduced_div = StrengthReducedU32::new(rhs); + let r = unary(lhs, |a| a / reduced_div, lhs.data_type().clone()); + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt16 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u16().unwrap(); + + let reduced_div = StrengthReducedU16::new(rhs); + + let r = unary(lhs, |a| a / reduced_div, lhs.data_type().clone()); + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt8 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u8().unwrap(); + + let reduced_div = StrengthReducedU8::new(rhs); + let r = unary(lhs, |a| a / reduced_div, lhs.data_type().clone()); + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + _ => unary(lhs, |a| a / rhs, lhs.data_type().clone()), + } +} + +/// Checked division of a primitive array of type T by a scalar T. If the +/// divisor is zero then the validity array is changed to None. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_div_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let result = checked_div_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(-1i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_div_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + CheckedDiv, +{ + let rhs = *rhs; + let op = move |a: T| a.checked_div(&rhs); + + unary_checked(lhs, op, lhs.data_type().clone()) +} + +// Implementation of ArrayDiv trait for PrimitiveArrays with a scalar +impl ArrayDiv for PrimitiveArray +where + T: NativeArithmetics + Div + NumCast, +{ + fn div(&self, rhs: &T) -> Self { + div_scalar(self, rhs) + } +} + +// Implementation of ArrayCheckedDiv trait for PrimitiveArrays with a scalar +impl ArrayCheckedDiv for PrimitiveArray +where + T: NativeArithmetics + CheckedDiv, +{ + fn checked_div(&self, rhs: &T) -> Self { + checked_div_scalar(self, rhs) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/mod.rs b/crates/nano-arrow/src/compute/arithmetics/basic/mod.rs new file mode 100644 index 000000000000..898a69f59536 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/mod.rs @@ -0,0 +1,100 @@ +//! Contains arithmetic functions for [`PrimitiveArray`]s. +//! +//! Each operation has four variants, like the rest of Rust's ecosystem: +//! * usual, that [`panic!`]s on overflow +//! * `checked_*` that turns overflowings to `None` +//! 
* `overflowing_*` returning a [`Bitmap`](crate::bitmap::Bitmap) with items that overflow. +//! * `saturating_*` that saturates the result. +mod add; +pub use add::*; +mod div; +pub use div::*; +mod mul; +pub use mul::*; +mod pow; +pub use pow::*; +mod rem; +pub use rem::*; +mod sub; +use std::ops::Neg; + +use num_traits::{CheckedNeg, WrappingNeg}; +pub use sub::*; + +use super::super::arity::{unary, unary_checked}; +use crate::array::PrimitiveArray; +use crate::types::NativeType; + +/// Trait describing a [`NativeType`] whose semantics of arithmetic in Arrow equals +/// the semantics in Rust. +/// A counter example is `i128`, that in arrow represents a decimal while in rust represents +/// a signed integer. +pub trait NativeArithmetics: NativeType {} +impl NativeArithmetics for u8 {} +impl NativeArithmetics for u16 {} +impl NativeArithmetics for u32 {} +impl NativeArithmetics for u64 {} +impl NativeArithmetics for i8 {} +impl NativeArithmetics for i16 {} +impl NativeArithmetics for i32 {} +impl NativeArithmetics for i64 {} +impl NativeArithmetics for f32 {} +impl NativeArithmetics for f64 {} + +/// Negates values from array. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::negate; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([None, Some(6), None, Some(7)]); +/// let result = negate(&a); +/// let expected = PrimitiveArray::from([None, Some(-6), None, Some(-7)]); +/// assert_eq!(result, expected) +/// ``` +pub fn negate(array: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + Neg, +{ + unary(array, |a| -a, array.data_type().clone()) +} + +/// Checked negates values from array. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_negate; +/// use arrow2::array::{Array, PrimitiveArray}; +/// +/// let a = PrimitiveArray::from([None, Some(6), Some(i8::MIN), Some(7)]); +/// let result = checked_negate(&a); +/// let expected = PrimitiveArray::from([None, Some(-6), None, Some(-7)]); +/// assert_eq!(result, expected); +/// assert!(!result.is_valid(2)) +/// ``` +pub fn checked_negate(array: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + CheckedNeg, +{ + unary_checked(array, |a| a.checked_neg(), array.data_type().clone()) +} + +/// Wrapping negates values from array. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_negate; +/// use arrow2::array::{Array, PrimitiveArray}; +/// +/// let a = PrimitiveArray::from([None, Some(6), Some(i8::MIN), Some(7)]); +/// let result = wrapping_negate(&a); +/// let expected = PrimitiveArray::from([None, Some(-6), Some(i8::MIN), Some(-7)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_negate(array: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + WrappingNeg, +{ + unary(array, |a| a.wrapping_neg(), array.data_type().clone()) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/mul.rs b/crates/nano-arrow/src/compute/arithmetics/basic/mul.rs new file mode 100644 index 000000000000..e006abe186e5 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/mul.rs @@ -0,0 +1,338 @@ +//! 
Definition of basic mul operations with primitive arrays +use std::ops::Mul; + +use num_traits::ops::overflowing::OverflowingMul; +use num_traits::{CheckedMul, SaturatingMul, WrappingMul}; + +use super::NativeArithmetics; +use crate::array::PrimitiveArray; +use crate::bitmap::Bitmap; +use crate::compute::arithmetics::{ + ArrayCheckedMul, ArrayMul, ArrayOverflowingMul, ArraySaturatingMul, ArrayWrappingMul, +}; +use crate::compute::arity::{ + binary, binary_checked, binary_with_bitmap, unary, unary_checked, unary_with_bitmap, +}; + +/// Multiplies two primitive arrays with the same type. +/// Panics if the multiplication of one pair of values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::mul; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(6)]); +/// let b = Int32Array::from(&[Some(5), None, None, Some(6)]); +/// let result = mul(&a, &b); +/// let expected = Int32Array::from(&[None, None, None, Some(36)]); +/// assert_eq!(result, expected) +/// ``` +pub fn mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + Mul, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a * b) +} + +/// Wrapping multiplication of two [`PrimitiveArray`]s. +/// It wraps around at the boundary of the type if the result overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_mul; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(100i8), Some(0x10i8), Some(100i8)]); +/// let b = PrimitiveArray::from([Some(0i8), Some(0x10i8), Some(0i8)]); +/// let result = wrapping_mul(&a, &b); +/// let expected = PrimitiveArray::from([Some(0), Some(0), Some(0)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + WrappingMul, +{ + let op = move |a: T, b: T| a.wrapping_mul(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked multiplication of two primitive arrays. If the result from the +/// multiplications overflows, the validity for that index is changed +/// returned. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_mul; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(100i8), Some(100i8), Some(100i8)]); +/// let b = Int8Array::from(&[Some(1i8), Some(100i8), Some(1i8)]); +/// let result = checked_mul(&a, &b); +/// let expected = Int8Array::from(&[Some(100i8), None, Some(100i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + CheckedMul, +{ + let op = move |a: T, b: T| a.checked_mul(&b); + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Saturating multiplication of two primitive arrays. If the result from the +/// multiplication overflows, the result for the +/// operation will be the saturated value. 
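+/// For example, `-100i8 * 100i8` saturates to `i8::MIN` (`-128`), as shown below.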
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_mul; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let b = Int8Array::from(&[Some(100i8)]); +/// let result = saturating_mul(&a, &b); +/// let expected = Int8Array::from(&[Some(-128)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingMul, +{ + let op = move |a: T, b: T| a.saturating_mul(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Overflowing multiplication of two primitive arrays. If the result from the +/// mul overflows, the result for the operation will be an array with +/// overflowed values and a validity array indicating the overflowing elements +/// from the array. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_mul; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(1i8), Some(-100i8)]); +/// let b = Int8Array::from(&[Some(1i8), Some(100i8)]); +/// let (result, overflow) = overflowing_mul(&a, &b); +/// let expected = Int8Array::from(&[Some(1i8), Some(-16i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_mul( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingMul, +{ + let op = move |a: T, b: T| a.overflowing_mul(&b); + + binary_with_bitmap(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayMul trait for PrimitiveArrays +impl ArrayMul> for PrimitiveArray +where + T: NativeArithmetics + Mul, +{ + fn mul(&self, rhs: &PrimitiveArray) -> Self { + mul(self, rhs) + } +} + +impl ArrayWrappingMul> for PrimitiveArray +where + T: NativeArithmetics + WrappingMul, +{ + fn wrapping_mul(&self, rhs: &PrimitiveArray) -> Self { + wrapping_mul(self, rhs) + } +} + +// Implementation of ArrayCheckedMul trait for PrimitiveArrays +impl ArrayCheckedMul> for PrimitiveArray +where + T: NativeArithmetics + CheckedMul, +{ + fn checked_mul(&self, rhs: &PrimitiveArray) -> Self { + checked_mul(self, rhs) + } +} + +// Implementation of ArraySaturatingMul trait for PrimitiveArrays +impl ArraySaturatingMul> for PrimitiveArray +where + T: NativeArithmetics + SaturatingMul, +{ + fn saturating_mul(&self, rhs: &PrimitiveArray) -> Self { + saturating_mul(self, rhs) + } +} + +// Implementation of ArraySaturatingMul trait for PrimitiveArrays +impl ArrayOverflowingMul> for PrimitiveArray +where + T: NativeArithmetics + OverflowingMul, +{ + fn overflowing_mul(&self, rhs: &PrimitiveArray) -> (Self, Bitmap) { + overflowing_mul(self, rhs) + } +} + +/// Multiply a scalar T to a primitive array of type T. +/// Panics if the multiplication of the values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::mul_scalar; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(6)]); +/// let result = mul_scalar(&a, &2i32); +/// let expected = Int32Array::from(&[None, Some(12), None, Some(12)]); +/// assert_eq!(result, expected) +/// ``` +pub fn mul_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + Mul, +{ + let rhs = *rhs; + unary(lhs, |a| a * rhs, lhs.data_type().clone()) +} + +/// Wrapping multiplication of a scalar T to a [`PrimitiveArray`] of type T. +/// It do nothing if the result overflows. 
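+/// More precisely, the result wraps around at the numeric boundary of `T`
+/// (e.g. `0x10i8 * 0x10i8` wraps to `0`, as in the example below).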
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_mul_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(0x10)]); +/// let result = wrapping_mul_scalar(&a, &0x10); +/// let expected = Int8Array::from(&[None, Some(0)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_mul_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + WrappingMul, +{ + unary(lhs, |a| a.wrapping_mul(rhs), lhs.data_type().clone()) +} + +/// Checked multiplication of a scalar T to a primitive array of type T. If the +/// result from the multiplication overflows, then the validity for that index is +/// changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_mul_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(100), None, Some(100)]); +/// let result = checked_mul_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[None, None, None, None]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_mul_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + CheckedMul, +{ + let rhs = *rhs; + let op = move |a: T| a.checked_mul(&rhs); + + unary_checked(lhs, op, lhs.data_type().clone()) +} + +/// Saturated multiplication of a scalar T to a primitive array of type T. If the +/// result from the mul overflows for this type, then +/// the result will be saturated +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_mul_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let result = saturating_mul_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(-128i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_mul_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingMul, +{ + let rhs = *rhs; + let op = move |a: T| a.saturating_mul(&rhs); + + unary(lhs, op, lhs.data_type().clone()) +} + +/// Overflowing multiplication of a scalar T to a primitive array of type T. 
If +/// the result from the mul overflows for this type, +/// then the result will be an array with overflowed values and a validity +/// array indicating the overflowing elements from the array +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_mul_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(1i8), Some(100i8)]); +/// let (result, overflow) = overflowing_mul_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(100i8), Some(16i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_mul_scalar(lhs: &PrimitiveArray, rhs: &T) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingMul, +{ + let rhs = *rhs; + let op = move |a: T| a.overflowing_mul(&rhs); + + unary_with_bitmap(lhs, op, lhs.data_type().clone()) +} + +// Implementation of ArrayMul trait for PrimitiveArrays with a scalar +impl ArrayMul for PrimitiveArray +where + T: NativeArithmetics + Mul, +{ + fn mul(&self, rhs: &T) -> Self { + mul_scalar(self, rhs) + } +} + +// Implementation of ArrayCheckedMul trait for PrimitiveArrays with a scalar +impl ArrayCheckedMul for PrimitiveArray +where + T: NativeArithmetics + CheckedMul, +{ + fn checked_mul(&self, rhs: &T) -> Self { + checked_mul_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingMul trait for PrimitiveArrays with a scalar +impl ArraySaturatingMul for PrimitiveArray +where + T: NativeArithmetics + SaturatingMul, +{ + fn saturating_mul(&self, rhs: &T) -> Self { + saturating_mul_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingMul trait for PrimitiveArrays with a scalar +impl ArrayOverflowingMul for PrimitiveArray +where + T: NativeArithmetics + OverflowingMul, +{ + fn overflowing_mul(&self, rhs: &T) -> (Self, Bitmap) { + overflowing_mul_scalar(self, rhs) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/pow.rs b/crates/nano-arrow/src/compute/arithmetics/basic/pow.rs new file mode 100644 index 000000000000..ea8908db6a51 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/pow.rs @@ -0,0 +1,49 @@ +//! Definition of basic pow operations with primitive arrays +use num_traits::{checked_pow, CheckedMul, One, Pow}; + +use super::NativeArithmetics; +use crate::array::PrimitiveArray; +use crate::compute::arity::{unary, unary_checked}; + +/// Raises an array of primitives to the power of exponent. Panics if one of +/// the values values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::powf_scalar; +/// use arrow2::array::Float32Array; +/// +/// let a = Float32Array::from(&[Some(2f32), None]); +/// let actual = powf_scalar(&a, 2.0); +/// let expected = Float32Array::from(&[Some(4f32), None]); +/// assert_eq!(expected, actual); +/// ``` +pub fn powf_scalar(array: &PrimitiveArray, exponent: T) -> PrimitiveArray +where + T: NativeArithmetics + Pow, +{ + unary(array, |x| x.pow(exponent), array.data_type().clone()) +} + +/// Checked operation of raising an array of primitives to the power of +/// exponent. If the result from the multiplications overflows, the validity +/// for that index is changed returned. 
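+/// That is, any entry whose exponentiation overflows becomes null in the returned array.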
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_powf_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(1i8), None, Some(7i8)]); +/// let actual = checked_powf_scalar(&a, 8usize); +/// let expected = Int8Array::from(&[Some(1i8), None, None]); +/// assert_eq!(expected, actual); +/// ``` +pub fn checked_powf_scalar(array: &PrimitiveArray, exponent: usize) -> PrimitiveArray +where + T: NativeArithmetics + CheckedMul + One, +{ + let op = move |a: T| checked_pow(a, exponent); + + unary_checked(array, op, array.data_type().clone()) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/rem.rs b/crates/nano-arrow/src/compute/arithmetics/basic/rem.rs new file mode 100644 index 000000000000..6c400fce2b07 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/rem.rs @@ -0,0 +1,196 @@ +use std::ops::Rem; + +use num_traits::{CheckedRem, NumCast}; +use strength_reduce::{ + StrengthReducedU16, StrengthReducedU32, StrengthReducedU64, StrengthReducedU8, +}; + +use super::NativeArithmetics; +use crate::array::{Array, PrimitiveArray}; +use crate::compute::arithmetics::{ArrayCheckedRem, ArrayRem}; +use crate::compute::arity::{binary, binary_checked, unary, unary_checked}; +use crate::datatypes::PrimitiveType; + +/// Remainder of two primitive arrays with the same type. +/// Panics if the divisor is zero of one pair of values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::rem; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[Some(10), Some(7)]); +/// let b = Int32Array::from(&[Some(5), Some(6)]); +/// let result = rem(&a, &b); +/// let expected = Int32Array::from(&[Some(0), Some(1)]); +/// assert_eq!(result, expected) +/// ``` +pub fn rem(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + Rem, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a % b) +} + +/// Checked remainder of two primitive arrays. If the result from the remainder +/// overflows, the result for the operation will change the validity array +/// making this operation None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_rem; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8), Some(10i8)]); +/// let b = Int8Array::from(&[Some(100i8), Some(0i8)]); +/// let result = checked_rem(&a, &b); +/// let expected = Int8Array::from(&[Some(-0i8), None]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_rem(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + CheckedRem, +{ + let op = move |a: T, b: T| a.checked_rem(&b); + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +impl ArrayRem> for PrimitiveArray +where + T: NativeArithmetics + Rem, +{ + fn rem(&self, rhs: &PrimitiveArray) -> Self { + rem(self, rhs) + } +} + +impl ArrayCheckedRem> for PrimitiveArray +where + T: NativeArithmetics + CheckedRem, +{ + fn checked_rem(&self, rhs: &PrimitiveArray) -> Self { + checked_rem(self, rhs) + } +} + +/// Remainder a primitive array of type T by a scalar T. +/// Panics if the divisor is zero. 
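+/// For unsigned integer types the divisor is pre-processed with the `strength_reduce`
+/// crate (`StrengthReducedU8`/`U16`/`U32`/`U64`), the same optimization used by
+/// `div_scalar`, so the per-element remainder avoids a full hardware division.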
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::rem_scalar; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(7)]); +/// let result = rem_scalar(&a, &2i32); +/// let expected = Int32Array::from(&[None, Some(0), None, Some(1)]); +/// assert_eq!(result, expected) +/// ``` +pub fn rem_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + Rem + NumCast, +{ + let rhs = *rhs; + + match T::PRIMITIVE { + PrimitiveType::UInt64 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u64().unwrap(); + + let reduced_rem = StrengthReducedU64::new(rhs); + + // small hack to avoid a transmute of `PrimitiveArray` to `PrimitiveArray` + let r = unary(lhs, |a| a % reduced_rem, lhs.data_type().clone()); + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt32 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u32().unwrap(); + + let reduced_rem = StrengthReducedU32::new(rhs); + + let r = unary(lhs, |a| a % reduced_rem, lhs.data_type().clone()); + // small hack to avoid an unsafe transmute of `PrimitiveArray` to `PrimitiveArray` + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt16 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u16().unwrap(); + + let reduced_rem = StrengthReducedU16::new(rhs); + + let r = unary(lhs, |a| a % reduced_rem, lhs.data_type().clone()); + // small hack to avoid an unsafe transmute of `PrimitiveArray` to `PrimitiveArray` + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + PrimitiveType::UInt8 => { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let rhs = rhs.to_u8().unwrap(); + + let reduced_rem = StrengthReducedU8::new(rhs); + + let r = unary(lhs, |a| a % reduced_rem, lhs.data_type().clone()); + // small hack to avoid an unsafe transmute of `PrimitiveArray` to `PrimitiveArray` + (&r as &dyn Array) + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + }, + _ => unary(lhs, |a| a % rhs, lhs.data_type().clone()), + } +} + +/// Checked remainder of a primitive array of type T by a scalar T. If the +/// divisor is zero then the validity array is changed to None. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_rem_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let result = checked_rem_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(0i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_rem_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + CheckedRem, +{ + let rhs = *rhs; + let op = move |a: T| a.checked_rem(&rhs); + + unary_checked(lhs, op, lhs.data_type().clone()) +} + +impl ArrayRem for PrimitiveArray +where + T: NativeArithmetics + Rem + NumCast, +{ + fn rem(&self, rhs: &T) -> Self { + rem_scalar(self, rhs) + } +} + +impl ArrayCheckedRem for PrimitiveArray +where + T: NativeArithmetics + CheckedRem, +{ + fn checked_rem(&self, rhs: &T) -> Self { + checked_rem_scalar(self, rhs) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/basic/sub.rs b/crates/nano-arrow/src/compute/arithmetics/basic/sub.rs new file mode 100644 index 000000000000..5b2dcd36cb25 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/basic/sub.rs @@ -0,0 +1,337 @@ +//! 
Definition of basic sub operations with primitive arrays +use std::ops::Sub; + +use num_traits::ops::overflowing::OverflowingSub; +use num_traits::{CheckedSub, SaturatingSub, WrappingSub}; + +use super::NativeArithmetics; +use crate::array::PrimitiveArray; +use crate::bitmap::Bitmap; +use crate::compute::arithmetics::{ + ArrayCheckedSub, ArrayOverflowingSub, ArraySaturatingSub, ArraySub, ArrayWrappingSub, +}; +use crate::compute::arity::{ + binary, binary_checked, binary_with_bitmap, unary, unary_checked, unary_with_bitmap, +}; + +/// Subtracts two primitive arrays with the same type. +/// Panics if the subtraction of one pair of values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::sub; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(6)]); +/// let b = Int32Array::from(&[Some(5), None, None, Some(6)]); +/// let result = sub(&a, &b); +/// let expected = Int32Array::from(&[None, None, None, Some(0)]); +/// assert_eq!(result, expected) +/// ``` +pub fn sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + Sub, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a - b) +} + +/// Wrapping subtraction of two [`PrimitiveArray`]s. +/// It wraps around at the boundary of the type if the result overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_sub; +/// use arrow2::array::PrimitiveArray; +/// +/// let a = PrimitiveArray::from([Some(-100i8), Some(-100i8), Some(100i8)]); +/// let b = PrimitiveArray::from([Some(0i8), Some(100i8), Some(0i8)]); +/// let result = wrapping_sub(&a, &b); +/// let expected = PrimitiveArray::from([Some(-100i8), Some(56i8), Some(100i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + WrappingSub, +{ + let op = move |a: T, b: T| a.wrapping_sub(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked subtraction of two primitive arrays. If the result from the +/// subtraction overflow, the validity for that index is changed +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_sub; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(100i8), Some(-100i8), Some(100i8)]); +/// let b = Int8Array::from(&[Some(1i8), Some(100i8), Some(0i8)]); +/// let result = checked_sub(&a, &b); +/// let expected = Int8Array::from(&[Some(99i8), None, Some(100i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + CheckedSub, +{ + let op = move |a: T, b: T| a.checked_sub(&b); + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Saturating subtraction of two primitive arrays. If the result from the sub +/// is smaller than the possible number for this type, the result for the +/// operation will be the saturated value. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_sub; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let b = Int8Array::from(&[Some(100i8)]); +/// let result = saturating_sub(&a, &b); +/// let expected = Int8Array::from(&[Some(-128)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingSub, +{ + let op = move |a: T, b: T| a.saturating_sub(&b); + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Overflowing subtraction of two primitive arrays. If the result from the sub +/// is smaller than the possible number for this type, the result for the +/// operation will be an array with overflowed values and a validity array +/// indicating the overflowing elements from the array. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_sub; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(1i8), Some(-100i8)]); +/// let b = Int8Array::from(&[Some(1i8), Some(100i8)]); +/// let (result, overflow) = overflowing_sub(&a, &b); +/// let expected = Int8Array::from(&[Some(0i8), Some(56i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_sub( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingSub, +{ + let op = move |a: T, b: T| a.overflowing_sub(&b); + + binary_with_bitmap(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArraySub trait for PrimitiveArrays +impl ArraySub> for PrimitiveArray +where + T: NativeArithmetics + Sub, +{ + fn sub(&self, rhs: &PrimitiveArray) -> Self { + sub(self, rhs) + } +} + +impl ArrayWrappingSub> for PrimitiveArray +where + T: NativeArithmetics + WrappingSub, +{ + fn wrapping_sub(&self, rhs: &PrimitiveArray) -> Self { + wrapping_sub(self, rhs) + } +} + +// Implementation of ArrayCheckedSub trait for PrimitiveArrays +impl ArrayCheckedSub> for PrimitiveArray +where + T: NativeArithmetics + CheckedSub, +{ + fn checked_sub(&self, rhs: &PrimitiveArray) -> Self { + checked_sub(self, rhs) + } +} + +// Implementation of ArraySaturatingSub trait for PrimitiveArrays +impl ArraySaturatingSub> for PrimitiveArray +where + T: NativeArithmetics + SaturatingSub, +{ + fn saturating_sub(&self, rhs: &PrimitiveArray) -> Self { + saturating_sub(self, rhs) + } +} + +// Implementation of ArraySaturatingSub trait for PrimitiveArrays +impl ArrayOverflowingSub> for PrimitiveArray +where + T: NativeArithmetics + OverflowingSub, +{ + fn overflowing_sub(&self, rhs: &PrimitiveArray) -> (Self, Bitmap) { + overflowing_sub(self, rhs) + } +} + +/// Subtract a scalar T to a primitive array of type T. +/// Panics if the subtraction of the values overflows. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::sub_scalar; +/// use arrow2::array::Int32Array; +/// +/// let a = Int32Array::from(&[None, Some(6), None, Some(6)]); +/// let result = sub_scalar(&a, &1i32); +/// let expected = Int32Array::from(&[None, Some(5), None, Some(5)]); +/// assert_eq!(result, expected) +/// ``` +pub fn sub_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + Sub, +{ + let rhs = *rhs; + unary(lhs, |a| a - rhs, lhs.data_type().clone()) +} + +/// Wrapping subtraction of a scalar T to a [`PrimitiveArray`] of type T. +/// It do nothing if the result overflows. 
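+/// On overflow the value simply wraps around, e.g. `-100i8 - 100i8` wraps to `56`.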
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::wrapping_sub_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(-100)]); +/// let result = wrapping_sub_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[None, Some(56)]); +/// assert_eq!(result, expected); +/// ``` +pub fn wrapping_sub_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + WrappingSub, +{ + unary(lhs, |a| a.wrapping_sub(rhs), lhs.data_type().clone()) +} + +/// Checked subtraction of a scalar T to a primitive array of type T. If the +/// result from the subtraction overflows, then the validity for that index +/// is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::checked_sub_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[None, Some(-100), None, Some(-100)]); +/// let result = checked_sub_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[None, None, None, None]); +/// assert_eq!(result, expected); +/// ``` +pub fn checked_sub_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + CheckedSub, +{ + let rhs = *rhs; + let op = move |a: T| a.checked_sub(&rhs); + + unary_checked(lhs, op, lhs.data_type().clone()) +} + +/// Saturated subtraction of a scalar T to a primitive array of type T. If the +/// result from the sub is smaller than the possible number for this type, then +/// the result will be saturated +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::saturating_sub_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(-100i8)]); +/// let result = saturating_sub_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(-128i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_sub_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeArithmetics + SaturatingSub, +{ + let rhs = *rhs; + let op = move |a: T| a.saturating_sub(&rhs); + + unary(lhs, op, lhs.data_type().clone()) +} + +/// Overflowing subtraction of a scalar T to a primitive array of type T. 
If +/// the result from the sub is smaller than the possible number for this type, +/// then the result will be an array with overflowed values and a validity +/// array indicating the overflowing elements from the array +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::basic::overflowing_sub_scalar; +/// use arrow2::array::Int8Array; +/// +/// let a = Int8Array::from(&[Some(1i8), Some(-100i8)]); +/// let (result, overflow) = overflowing_sub_scalar(&a, &100i8); +/// let expected = Int8Array::from(&[Some(-99i8), Some(56i8)]); +/// assert_eq!(result, expected); +/// ``` +pub fn overflowing_sub_scalar(lhs: &PrimitiveArray, rhs: &T) -> (PrimitiveArray, Bitmap) +where + T: NativeArithmetics + OverflowingSub, +{ + let rhs = *rhs; + let op = move |a: T| a.overflowing_sub(&rhs); + + unary_with_bitmap(lhs, op, lhs.data_type().clone()) +} + +// Implementation of ArraySub trait for PrimitiveArrays with a scalar +impl ArraySub for PrimitiveArray +where + T: NativeArithmetics + Sub, +{ + fn sub(&self, rhs: &T) -> Self { + sub_scalar(self, rhs) + } +} + +// Implementation of ArrayCheckedSub trait for PrimitiveArrays with a scalar +impl ArrayCheckedSub for PrimitiveArray +where + T: NativeArithmetics + CheckedSub, +{ + fn checked_sub(&self, rhs: &T) -> Self { + checked_sub_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingSub trait for PrimitiveArrays with a scalar +impl ArraySaturatingSub for PrimitiveArray +where + T: NativeArithmetics + SaturatingSub, +{ + fn saturating_sub(&self, rhs: &T) -> Self { + saturating_sub_scalar(self, rhs) + } +} + +// Implementation of ArraySaturatingSub trait for PrimitiveArrays with a scalar +impl ArrayOverflowingSub for PrimitiveArray +where + T: NativeArithmetics + OverflowingSub, +{ + fn overflowing_sub(&self, rhs: &T) -> (Self, Bitmap) { + overflowing_sub_scalar(self, rhs) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/decimal/add.rs b/crates/nano-arrow/src/compute/arithmetics/decimal/add.rs new file mode 100644 index 000000000000..dccdb6b144c1 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/decimal/add.rs @@ -0,0 +1,236 @@ +//! Defines the addition arithmetic kernels for [`PrimitiveArray`] representing decimals. +use super::{adjusted_precision_scale, get_parameters, max_value, number_digits}; +use crate::array::PrimitiveArray; +use crate::compute::arithmetics::{ArrayAdd, ArrayCheckedAdd, ArraySaturatingAdd}; +use crate::compute::arity::{binary, binary_checked}; +use crate::compute::utils::{check_same_len, combine_validities}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +/// Adds two decimal [`PrimitiveArray`] with the same precision and scale. +/// # Error +/// Errors if the precision and scale are different. +/// # Panic +/// This function panics iff the added numbers result in a number larger than +/// the possible number for the precision. 
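+/// Operands are added as unscaled `i128` values (with `Decimal(5, 2)`, `1.23` is
+/// stored as `123i128`) and the sum is checked against the largest value the
+/// precision can represent, i.e. `10^precision - 1`.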
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::add; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1i128), Some(1i128), None, Some(2i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(1i128), Some(2i128), None, Some(2i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = add(&a, &b); +/// let expected = PrimitiveArray::from([Some(2i128), Some(3i128), None, Some(4i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + let op = move |a, b| { + let res: i128 = a + b; + + assert!( + res.abs() <= max, + "Overflow in addition presented for precision {precision}" + ); + + res + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Saturated addition of two decimal primitive arrays with the same precision +/// and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. If the result from the sum is larger than +/// the possible number with the selected precision then the resulted number in +/// the arrow array is the maximum number for the selected precision. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::saturating_add; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(99000i128), Some(11100i128), None, Some(22200i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(01000i128), Some(22200i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = saturating_add(&a, &b); +/// let expected = PrimitiveArray::from([Some(99999i128), Some(33300i128), None, Some(33300i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_add( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + let op = move |a, b| { + let res: i128 = a + b; + + if res.abs() > max { + if res > 0 { + max + } else { + -max + } + } else { + res + } + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked addition of two decimal primitive arrays with the same precision +/// and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. 
If the result from the sum is larger than +/// the possible number with the selected precision (overflowing), then the +/// validity for that index is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::checked_add; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(99000i128), Some(11100i128), None, Some(22200i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(01000i128), Some(22200i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = checked_add(&a, &b); +/// let expected = PrimitiveArray::from([None, Some(33300i128), None, Some(33300i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn checked_add(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + let op = move |a, b| { + let result: i128 = a + b; + + if result.abs() > max { + None + } else { + Some(result) + } + }; + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayAdd trait for PrimitiveArrays +impl ArrayAdd> for PrimitiveArray { + fn add(&self, rhs: &PrimitiveArray) -> Self { + add(self, rhs) + } +} + +// Implementation of ArrayCheckedAdd trait for PrimitiveArrays +impl ArrayCheckedAdd> for PrimitiveArray { + fn checked_add(&self, rhs: &PrimitiveArray) -> Self { + checked_add(self, rhs) + } +} + +// Implementation of ArraySaturatingAdd trait for PrimitiveArrays +impl ArraySaturatingAdd> for PrimitiveArray { + fn saturating_add(&self, rhs: &PrimitiveArray) -> Self { + saturating_add(self, rhs) + } +} + +/// Adaptive addition of two decimal primitive arrays with different precision +/// and scale. If the precision and scale is different, then the smallest scale +/// and precision is adjusted to the largest precision and scale. 
If during the +/// addition one of the results is larger than the max possible value, the +/// result precision is changed to the precision of the max value +/// +/// ```nocode +/// 11111.11 -> 7, 2 +/// 11111.111 -> 8, 3 +/// ------------------ +/// 22222.221 -> 8, 3 +/// ``` +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::adaptive_add; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(11111_11i128)]).to(DataType::Decimal(7, 2)); +/// let b = PrimitiveArray::from([Some(11111_111i128)]).to(DataType::Decimal(8, 3)); +/// let result = adaptive_add(&a, &b).unwrap(); +/// let expected = PrimitiveArray::from([Some(22222_221i128)]).to(DataType::Decimal(8, 3)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn adaptive_add( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> Result> { + check_same_len(lhs, rhs)?; + + let (lhs_p, lhs_s, rhs_p, rhs_s) = + if let (DataType::Decimal(lhs_p, lhs_s), DataType::Decimal(rhs_p, rhs_s)) = + (lhs.data_type(), rhs.data_type()) + { + (*lhs_p, *lhs_s, *rhs_p, *rhs_s) + } else { + return Err(Error::InvalidArgumentError( + "Incorrect data type for the array".to_string(), + )); + }; + + // The resulting precision is mutable because it could change while + // looping through the iterator + let (mut res_p, res_s, diff) = adjusted_precision_scale(lhs_p, lhs_s, rhs_p, rhs_s); + + let shift = 10i128.pow(diff as u32); + let mut max = max_value(res_p); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| { + // Based on the array's scales one of the arguments in the sum has to be shifted + // to the left to match the final scale + let res = if lhs_s > rhs_s { + l + r * shift + } else { + l * shift + r + }; + + // The precision of the resulting array will change if one of the + // sums during the iteration produces a value bigger than the + // possible value for the initial precision + + // 99.9999 -> 6, 4 + // 00.0001 -> 6, 4 + // ----------------- + // 100.0000 -> 7, 4 + if res.abs() > max { + res_p = number_digits(res); + max = max_value(res_p); + } + res + }) + .collect::>(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + Ok(PrimitiveArray::::new( + DataType::Decimal(res_p, res_s), + values.into(), + validity, + )) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/decimal/div.rs b/crates/nano-arrow/src/compute/arithmetics/decimal/div.rs new file mode 100644 index 000000000000..1576fc061947 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/decimal/div.rs @@ -0,0 +1,302 @@ +//! Defines the division arithmetic kernels for Decimal +//! `PrimitiveArrays`. + +use super::{adjusted_precision_scale, get_parameters, max_value, number_digits}; +use crate::array::PrimitiveArray; +use crate::compute::arithmetics::{ArrayCheckedDiv, ArrayDiv}; +use crate::compute::arity::{binary, binary_checked, unary}; +use crate::compute::utils::{check_same_len, combine_validities}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::scalar::{PrimitiveScalar, Scalar}; + +/// Divide two decimal primitive arrays with the same precision and scale. If +/// the precision and scale is different, then an InvalidArgumentError is +/// returned. This function panics if the dividend is divided by 0 or None. +/// This function also panics if the division produces a number larger +/// than the possible number for the array precision. 
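+/// The dividend is first rescaled by `10^scale` so that integer division keeps the
+/// fractional digits: with scale 3, `222.222 / 123.456` is computed as
+/// `222222000 / 123456 = 1800`, i.e. `1.800`.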
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::div; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1_00i128), Some(4_00i128), Some(6_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(1_00i128), Some(2_00i128), Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = div(&a, &b); +/// let expected = PrimitiveArray::from([Some(1_00i128), Some(2_00i128), Some(3_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn div(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + let op = move |a: i128, b: i128| { + // The division is done using the numbers without scale. + // The dividend is scaled up to maintain precision after the + // division + + // 222.222 --> 222222000 + // 123.456 --> 123456 + // -------- --------- + // 1.800 <-- 1800 + let numeral: i128 = a * scale; + + // The division can overflow if the dividend is divided + // by zero. + let res: i128 = numeral.checked_div(b).expect("Found division by zero"); + + assert!( + res.abs() <= max, + "Overflow in multiplication presented for precision {precision}" + ); + + res + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Multiply a decimal [`PrimitiveArray`] with a [`PrimitiveScalar`] with the same precision and scale. If +/// the precision and scale is different, then an InvalidArgumentError is +/// returned. This function panics if the multiplied numbers result in a number +/// larger than the possible number for the selected precision. +pub fn div_scalar(lhs: &PrimitiveArray, rhs: &PrimitiveScalar) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let rhs = if let Some(rhs) = *rhs.value() { + rhs + } else { + return PrimitiveArray::::new_null(lhs.data_type().clone(), lhs.len()); + }; + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128| { + // The division is done using the numbers without scale. + // The dividend is scaled up to maintain precision after the + // division + + // 222.222 --> 222222000 + // 123.456 --> 123456 + // -------- --------- + // 1.800 <-- 1800 + let numeral: i128 = a * scale; + + // The division can overflow if the dividend is divided + // by zero. + let res: i128 = numeral.checked_div(rhs).expect("Found division by zero"); + + assert!( + res.abs() <= max, + "Overflow in multiplication presented for precision {precision}" + ); + + res + }; + + unary(lhs, op, lhs.data_type().clone()) +} + +/// Saturated division of two decimal primitive arrays with the same +/// precision and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. If the result from the division is +/// larger than the possible number with the selected precision then the +/// resulted number in the arrow array is the maximum number for the selected +/// precision. The function panics if divided by zero. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::saturating_div; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(999_99i128), Some(4_00i128), Some(6_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(000_01i128), Some(2_00i128), Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = saturating_div(&a, &b); +/// let expected = PrimitiveArray::from([Some(999_99i128), Some(2_00i128), Some(3_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_div( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128, b: i128| { + let numeral: i128 = a * scale; + + match numeral.checked_div(b) { + Some(res) => match res { + res if res.abs() > max => { + if res > 0 { + max + } else { + -max + } + }, + _ => res, + }, + None => 0, + } + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked division of two decimal primitive arrays with the same precision +/// and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. If the divisor is zero, then the +/// validity for that index is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::checked_div; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1_00i128), Some(4_00i128), Some(6_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(000_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = checked_div(&a, &b); +/// let expected = PrimitiveArray::from([None, None, Some(3_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn checked_div(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128, b: i128| { + let numeral: i128 = a * scale; + + match numeral.checked_div(b) { + Some(res) => match res { + res if res.abs() > max => None, + _ => Some(res), + }, + None => None, + } + }; + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayDiv trait for PrimitiveArrays +impl ArrayDiv> for PrimitiveArray { + fn div(&self, rhs: &PrimitiveArray) -> Self { + div(self, rhs) + } +} + +// Implementation of ArrayCheckedDiv trait for PrimitiveArrays +impl ArrayCheckedDiv> for PrimitiveArray { + fn checked_div(&self, rhs: &PrimitiveArray) -> Self { + checked_div(self, rhs) + } +} + +/// Adaptive division of two decimal primitive arrays with different precision +/// and scale. If the precision and scale is different, then the smallest scale +/// and precision is adjusted to the largest precision and scale. If during the +/// division one of the results is larger than the max possible value, the +/// result precision is changed to the precision of the max value. The function +/// panics when divided by zero. 
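+/// The result uses the larger scale of the two inputs and a precision wide enough
+/// for the larger count of integer digits plus that scale, as sketched below.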
+/// +/// ```nocode +/// 1000.00 -> 7, 2 +/// 10.0000 -> 6, 4 +/// ----------------- +/// 100.0000 -> 9, 4 +/// ``` +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::adaptive_div; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1000_00i128)]).to(DataType::Decimal(7, 2)); +/// let b = PrimitiveArray::from([Some(10_0000i128)]).to(DataType::Decimal(6, 4)); +/// let result = adaptive_div(&a, &b).unwrap(); +/// let expected = PrimitiveArray::from([Some(100_0000i128)]).to(DataType::Decimal(9, 4)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn adaptive_div( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> Result> { + check_same_len(lhs, rhs)?; + + let (lhs_p, lhs_s, rhs_p, rhs_s) = + if let (DataType::Decimal(lhs_p, lhs_s), DataType::Decimal(rhs_p, rhs_s)) = + (lhs.data_type(), rhs.data_type()) + { + (*lhs_p, *lhs_s, *rhs_p, *rhs_s) + } else { + return Err(Error::InvalidArgumentError( + "Incorrect data type for the array".to_string(), + )); + }; + + // The resulting precision is mutable because it could change while + // looping through the iterator + let (mut res_p, res_s, diff) = adjusted_precision_scale(lhs_p, lhs_s, rhs_p, rhs_s); + + let shift = 10i128.pow(diff as u32); + let shift_1 = 10i128.pow(res_s as u32); + let mut max = max_value(res_p); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| { + let numeral: i128 = l * shift_1; + + // Based on the array's scales one of the arguments in the sum has to be shifted + // to the left to match the final scale + let res = if lhs_s > rhs_s { + numeral.checked_div(r * shift) + } else { + (numeral * shift).checked_div(*r) + } + .expect("Found division by zero"); + + // The precision of the resulting array will change if one of the + // multiplications during the iteration produces a value bigger + // than the possible value for the initial precision + + // 10.0000 -> 6, 4 + // 00.1000 -> 6, 4 + // ----------------- + // 100.0000 -> 7, 4 + if res.abs() > max { + res_p = number_digits(res); + max = max_value(res_p); + } + + res + }) + .collect::>(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + Ok(PrimitiveArray::::new( + DataType::Decimal(res_p, res_s), + values.into(), + validity, + )) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/decimal/mod.rs b/crates/nano-arrow/src/compute/arithmetics/decimal/mod.rs new file mode 100644 index 000000000000..4b412ef13c6e --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/decimal/mod.rs @@ -0,0 +1,119 @@ +//! Defines the arithmetic kernels for Decimal `PrimitiveArrays`. The +//! [`Decimal`](crate::datatypes::DataType::Decimal) type specifies the +//! precision and scale parameters. These affect the arithmetic operations and +//! need to be considered while doing operations with Decimal numbers. 
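+//!
+//! A decimal value is stored as an unscaled `i128` next to its
+//! `DataType::Decimal(precision, scale)`. As an illustrative sketch, using the same
+//! constructors as the kernel examples in this module:
+//!
+//! ```
+//! use arrow2::array::PrimitiveArray;
+//! use arrow2::datatypes::DataType;
+//!
+//! // 1.23 with precision 5 and scale 2 is stored as the unscaled integer 123
+//! let a = PrimitiveArray::from([Some(123i128)]).to(DataType::Decimal(5, 2));
+//! assert_eq!(a.data_type(), &DataType::Decimal(5, 2));
+//! ```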
+ +mod add; +pub use add::*; +mod div; +pub use div::*; +mod mul; +pub use mul::*; +mod sub; +pub use sub::*; + +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +/// Maximum value that can exist with a selected precision +#[inline] +fn max_value(precision: usize) -> i128 { + 10i128.pow(precision as u32) - 1 +} + +// Calculates the number of digits in a i128 number +fn number_digits(num: i128) -> usize { + let mut num = num.abs(); + let mut digit: i128 = 0; + let base = 10i128; + + while num != 0 { + num /= base; + digit += 1; + } + + digit as usize +} + +fn get_parameters(lhs: &DataType, rhs: &DataType) -> Result<(usize, usize)> { + if let (DataType::Decimal(lhs_p, lhs_s), DataType::Decimal(rhs_p, rhs_s)) = + (lhs.to_logical_type(), rhs.to_logical_type()) + { + if lhs_p == rhs_p && lhs_s == rhs_s { + Ok((*lhs_p, *lhs_s)) + } else { + Err(Error::InvalidArgumentError( + "Arrays must have the same precision and scale".to_string(), + )) + } + } else { + unreachable!() + } +} + +/// Returns the adjusted precision and scale for the lhs and rhs precision and +/// scale +fn adjusted_precision_scale( + lhs_p: usize, + lhs_s: usize, + rhs_p: usize, + rhs_s: usize, +) -> (usize, usize, usize) { + // The initial new precision and scale is based on the number of digits + // that lhs and rhs number has before and after the point. The max + // number of digits before and after the point will make the last + // precision and scale of the result + + // Digits before/after point + // before after + // 11.1111 -> 5, 4 -> 2 4 + // 11111.01 -> 7, 2 -> 5 2 + // ----------------- + // 11122.1211 -> 9, 4 -> 5 4 + let lhs_digits_before = lhs_p - lhs_s; + let rhs_digits_before = rhs_p - rhs_s; + + let res_digits_before = std::cmp::max(lhs_digits_before, rhs_digits_before); + + let (res_s, diff) = if lhs_s > rhs_s { + (lhs_s, lhs_s - rhs_s) + } else { + (rhs_s, rhs_s - lhs_s) + }; + + let res_p = res_digits_before + res_s; + + (res_p, res_s, diff) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_max_value() { + assert_eq!(999, max_value(3)); + assert_eq!(99999, max_value(5)); + assert_eq!(999999, max_value(6)); + } + + #[test] + fn test_number_digits() { + assert_eq!(2, number_digits(12i128)); + assert_eq!(3, number_digits(123i128)); + assert_eq!(4, number_digits(1234i128)); + assert_eq!(6, number_digits(123456i128)); + assert_eq!(7, number_digits(1234567i128)); + assert_eq!(7, number_digits(-1234567i128)); + assert_eq!(3, number_digits(-123i128)); + } + + #[test] + fn test_adjusted_precision_scale() { + // 11.1111 -> 5, 4 -> 2 4 + // 11111.01 -> 7, 2 -> 5 2 + // ----------------- + // 11122.1211 -> 9, 4 -> 5 4 + assert_eq!((9, 4, 2), adjusted_precision_scale(5, 4, 7, 2)) + } +} diff --git a/crates/nano-arrow/src/compute/arithmetics/decimal/mul.rs b/crates/nano-arrow/src/compute/arithmetics/decimal/mul.rs new file mode 100644 index 000000000000..a944279a133e --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/decimal/mul.rs @@ -0,0 +1,314 @@ +//! Defines the multiplication arithmetic kernels for Decimal +//! `PrimitiveArrays`. 
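+//!
+//! Multiplying two unscaled values doubles the scale, so every kernel divides the
+//! raw product by `10^scale` before checking it against the precision, e.g. for
+//! scale 3:
+//!
+//! ```nocode
+//! 111.111 * 222.222 -> 111111 * 222222 = 24691308642
+//! 24691308642 / 10^3 -> 24691308, i.e. 24691.308
+//! ```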
+ +use super::{adjusted_precision_scale, get_parameters, max_value, number_digits}; +use crate::array::PrimitiveArray; +use crate::compute::arithmetics::{ArrayCheckedMul, ArrayMul, ArraySaturatingMul}; +use crate::compute::arity::{binary, binary_checked, unary}; +use crate::compute::utils::{check_same_len, combine_validities}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::scalar::{PrimitiveScalar, Scalar}; + +/// Multiply two decimal primitive arrays with the same precision and scale. If +/// the precision and scale is different, then an InvalidArgumentError is +/// returned. This function panics if the multiplied numbers result in a number +/// larger than the possible number for the selected precision. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::mul; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1_00i128), Some(1_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(1_00i128), Some(2_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = mul(&a, &b); +/// let expected = PrimitiveArray::from([Some(1_00i128), Some(2_00i128), None, Some(4_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128, b: i128| { + // The multiplication between i128 can overflow if they are + // very large numbers. For that reason a checked + // multiplication is used. + let res: i128 = a.checked_mul(b).expect("Mayor overflow for multiplication"); + + // The multiplication is done using the numbers without scale. + // The resulting scale of the value has to be corrected by + // dividing by (10^scale) + + // 111.111 --> 111111 + // 222.222 --> 222222 + // -------- ------- + // 24691.308 <-- 24691308642 + let res = res / scale; + + assert!( + res.abs() <= max, + "Overflow in multiplication presented for precision {precision}" + ); + + res + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Multiply a decimal [`PrimitiveArray`] with a [`PrimitiveScalar`] with the same precision and scale. If +/// the precision and scale is different, then an InvalidArgumentError is +/// returned. This function panics if the multiplied numbers result in a number +/// larger than the possible number for the selected precision. +pub fn mul_scalar(lhs: &PrimitiveArray, rhs: &PrimitiveScalar) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let rhs = if let Some(rhs) = *rhs.value() { + rhs + } else { + return PrimitiveArray::::new_null(lhs.data_type().clone(), lhs.len()); + }; + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128| { + // The multiplication between i128 can overflow if they are + // very large numbers. For that reason a checked + // multiplication is used. + let res: i128 = a + .checked_mul(rhs) + .expect("Mayor overflow for multiplication"); + + // The multiplication is done using the numbers without scale. 
+ // The resulting scale of the value has to be corrected by + // dividing by (10^scale) + + // 111.111 --> 111111 + // 222.222 --> 222222 + // -------- ------- + // 24691.308 <-- 24691308642 + let res = res / scale; + + assert!( + res.abs() <= max, + "Overflow in multiplication presented for precision {precision}" + ); + + res + }; + + unary(lhs, op, lhs.data_type().clone()) +} + +/// Saturated multiplication of two decimal primitive arrays with the same +/// precision and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. If the result from the multiplication is +/// larger than the possible number with the selected precision then the +/// resulted number in the arrow array is the maximum number for the selected +/// precision. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::saturating_mul; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(999_99i128), Some(1_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(10_00i128), Some(2_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = saturating_mul(&a, &b); +/// let expected = PrimitiveArray::from([Some(999_99i128), Some(2_00i128), None, Some(4_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_mul( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128, b: i128| match a.checked_mul(b) { + Some(res) => { + let res = res / scale; + + match res { + res if res.abs() > max => { + if res > 0 { + max + } else { + -max + } + }, + _ => res, + } + }, + None => max, + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Checked multiplication of two decimal primitive arrays with the same +/// precision and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. 
If the result from the mul is larger than +/// the possible number with the selected precision (overflowing), then the +/// validity for that index is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::checked_mul; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(999_99i128), Some(1_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(10_00i128), Some(2_00i128), None, Some(2_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = checked_mul(&a, &b); +/// let expected = PrimitiveArray::from([None, Some(2_00i128), None, Some(4_00i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn checked_mul(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, scale) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let scale = 10i128.pow(scale as u32); + let max = max_value(precision); + + let op = move |a: i128, b: i128| match a.checked_mul(b) { + Some(res) => { + let res = res / scale; + + match res { + res if res.abs() > max => None, + _ => Some(res), + } + }, + None => None, + }; + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArrayMul trait for PrimitiveArrays +impl ArrayMul> for PrimitiveArray { + fn mul(&self, rhs: &PrimitiveArray) -> Self { + mul(self, rhs) + } +} + +// Implementation of ArrayCheckedMul trait for PrimitiveArrays +impl ArrayCheckedMul> for PrimitiveArray { + fn checked_mul(&self, rhs: &PrimitiveArray) -> Self { + checked_mul(self, rhs) + } +} + +// Implementation of ArraySaturatingMul trait for PrimitiveArrays +impl ArraySaturatingMul> for PrimitiveArray { + fn saturating_mul(&self, rhs: &PrimitiveArray) -> Self { + saturating_mul(self, rhs) + } +} + +/// Adaptive multiplication of two decimal primitive arrays with different +/// precision and scale. If the precision and scale is different, then the +/// smallest scale and precision is adjusted to the largest precision and +/// scale. 
If during the multiplication one of the results is larger than the +/// max possible value, the result precision is changed to the precision of the +/// max value +/// +/// ```nocode +/// 11111.0 -> 6, 1 +/// 10.002 -> 5, 3 +/// ----------------- +/// 111132.222 -> 9, 3 +/// ``` +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::adaptive_mul; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(11111_0i128), Some(1_0i128)]).to(DataType::Decimal(6, 1)); +/// let b = PrimitiveArray::from([Some(10_002i128), Some(2_000i128)]).to(DataType::Decimal(5, 3)); +/// let result = adaptive_mul(&a, &b).unwrap(); +/// let expected = PrimitiveArray::from([Some(111132_222i128), Some(2_000i128)]).to(DataType::Decimal(9, 3)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn adaptive_mul( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> Result> { + check_same_len(lhs, rhs)?; + + let (lhs_p, lhs_s, rhs_p, rhs_s) = + if let (DataType::Decimal(lhs_p, lhs_s), DataType::Decimal(rhs_p, rhs_s)) = + (lhs.data_type(), rhs.data_type()) + { + (*lhs_p, *lhs_s, *rhs_p, *rhs_s) + } else { + return Err(Error::InvalidArgumentError( + "Incorrect data type for the array".to_string(), + )); + }; + + // The resulting precision is mutable because it could change while + // looping through the iterator + let (mut res_p, res_s, diff) = adjusted_precision_scale(lhs_p, lhs_s, rhs_p, rhs_s); + + let shift = 10i128.pow(diff as u32); + let shift_1 = 10i128.pow(res_s as u32); + let mut max = max_value(res_p); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| { + // Based on the array's scales one of the arguments in the sum has to be shifted + // to the left to match the final scale + let res = if lhs_s > rhs_s { + l.checked_mul(r * shift) + } else { + (l * shift).checked_mul(*r) + } + .expect("Mayor overflow for multiplication"); + + let res = res / shift_1; + + // The precision of the resulting array will change if one of the + // multiplications during the iteration produces a value bigger + // than the possible value for the initial precision + + // 10.0000 -> 6, 4 + // 10.0000 -> 6, 4 + // ----------------- + // 100.0000 -> 7, 4 + if res.abs() > max { + res_p = number_digits(res); + max = max_value(res_p); + } + + res + }) + .collect::>(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + Ok(PrimitiveArray::::new( + DataType::Decimal(res_p, res_s), + values.into(), + validity, + )) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/decimal/sub.rs b/crates/nano-arrow/src/compute/arithmetics/decimal/sub.rs new file mode 100644 index 000000000000..2a0f7a72da17 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/decimal/sub.rs @@ -0,0 +1,238 @@ +//! Defines the subtract arithmetic kernels for Decimal `PrimitiveArrays`. + +use super::{adjusted_precision_scale, get_parameters, max_value, number_digits}; +use crate::array::PrimitiveArray; +use crate::compute::arithmetics::{ArrayCheckedSub, ArraySaturatingSub, ArraySub}; +use crate::compute::arity::{binary, binary_checked}; +use crate::compute::utils::{check_same_len, combine_validities}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +/// Subtract two decimal primitive arrays with the same precision and scale. If +/// the precision and scale is different, then an InvalidArgumentError is +/// returned. 
This function panics if the subtracted numbers result in a number +/// smaller than the possible number for the selected precision. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::sub; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(1i128), Some(1i128), None, Some(2i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(1i128), Some(2i128), None, Some(2i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = sub(&a, &b); +/// let expected = PrimitiveArray::from([Some(0i128), Some(-1i128), None, Some(0i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + + let op = move |a, b| { + let res: i128 = a - b; + + assert!( + res.abs() <= max, + "Overflow in subtract presented for precision {precision}" + ); + + res + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Saturated subtraction of two decimal primitive arrays with the same +/// precision and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. If the result from the sum is smaller +/// than the possible number with the selected precision then the resulted +/// number in the arrow array is the minimum number for the selected precision. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::saturating_sub; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(-99000i128), Some(11100i128), None, Some(22200i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(01000i128), Some(22200i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = saturating_sub(&a, &b); +/// let expected = PrimitiveArray::from([Some(-99999i128), Some(-11100i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn saturating_sub( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + + let op = move |a, b| { + let res: i128 = a - b; + + match res { + res if res.abs() > max => { + if res > 0 { + max + } else { + -max + } + }, + _ => res, + } + }; + + binary(lhs, rhs, lhs.data_type().clone(), op) +} + +// Implementation of ArraySub trait for PrimitiveArrays +impl ArraySub> for PrimitiveArray { + fn sub(&self, rhs: &PrimitiveArray) -> Self { + sub(self, rhs) + } +} + +// Implementation of ArrayCheckedSub trait for PrimitiveArrays +impl ArrayCheckedSub> for PrimitiveArray { + fn checked_sub(&self, rhs: &PrimitiveArray) -> Self { + checked_sub(self, rhs) + } +} + +// Implementation of ArraySaturatingSub trait for PrimitiveArrays +impl ArraySaturatingSub> for PrimitiveArray { + fn saturating_sub(&self, rhs: &PrimitiveArray) -> Self { + saturating_sub(self, rhs) + } +} +/// Checked subtract of two decimal primitive arrays with the same precision +/// and scale. If the precision and scale is different, then an +/// InvalidArgumentError is returned. 
If the result from the sub is larger than +/// the possible number with the selected precision (overflowing), then the +/// validity for that index is changed to None +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::checked_sub; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(-99000i128), Some(11100i128), None, Some(22200i128)]).to(DataType::Decimal(5, 2)); +/// let b = PrimitiveArray::from([Some(01000i128), Some(22200i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// let result = checked_sub(&a, &b); +/// let expected = PrimitiveArray::from([None, Some(-11100i128), None, Some(11100i128)]).to(DataType::Decimal(5, 2)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn checked_sub(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray { + let (precision, _) = get_parameters(lhs.data_type(), rhs.data_type()).unwrap(); + + let max = max_value(precision); + + let op = move |a, b| { + let res: i128 = a - b; + + match res { + res if res.abs() > max => None, + _ => Some(res), + } + }; + + binary_checked(lhs, rhs, lhs.data_type().clone(), op) +} + +/// Adaptive subtract of two decimal primitive arrays with different precision +/// and scale. If the precision and scale is different, then the smallest scale +/// and precision is adjusted to the largest precision and scale. If during the +/// addition one of the results is smaller than the min possible value, the +/// result precision is changed to the precision of the min value +/// +/// ```nocode +/// 99.9999 -> 6, 4 +/// -00.0001 -> 6, 4 +/// ----------------- +/// 100.0000 -> 7, 4 +/// ``` +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::decimal::adaptive_sub; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::DataType; +/// +/// let a = PrimitiveArray::from([Some(99_9999i128)]).to(DataType::Decimal(6, 4)); +/// let b = PrimitiveArray::from([Some(-00_0001i128)]).to(DataType::Decimal(6, 4)); +/// let result = adaptive_sub(&a, &b).unwrap(); +/// let expected = PrimitiveArray::from([Some(100_0000i128)]).to(DataType::Decimal(7, 4)); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn adaptive_sub( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> Result> { + check_same_len(lhs, rhs)?; + + let (lhs_p, lhs_s, rhs_p, rhs_s) = + if let (DataType::Decimal(lhs_p, lhs_s), DataType::Decimal(rhs_p, rhs_s)) = + (lhs.data_type(), rhs.data_type()) + { + (*lhs_p, *lhs_s, *rhs_p, *rhs_s) + } else { + return Err(Error::InvalidArgumentError( + "Incorrect data type for the array".to_string(), + )); + }; + + // The resulting precision is mutable because it could change while + // looping through the iterator + let (mut res_p, res_s, diff) = adjusted_precision_scale(lhs_p, lhs_s, rhs_p, rhs_s); + + let shift = 10i128.pow(diff as u32); + let mut max = max_value(res_p); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| { + // Based on the array's scales one of the arguments in the sum has to be shifted + // to the left to match the final scale + let res: i128 = if lhs_s > rhs_s { + l - r * shift + } else { + l * shift - r + }; + + // The precision of the resulting array will change if one of the + // subtraction during the iteration produces a value bigger than the + // possible value for the initial precision + + // -99.9999 -> 6, 4 + // 00.0001 -> 6, 4 + // ----------------- + // -100.0000 -> 7, 4 + if res.abs() > max { + res_p = number_digits(res); + max = 
max_value(res_p); + } + + res + }) + .collect::>(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + Ok(PrimitiveArray::::new( + DataType::Decimal(res_p, res_s), + values.into(), + validity, + )) +} diff --git a/crates/nano-arrow/src/compute/arithmetics/mod.rs b/crates/nano-arrow/src/compute/arithmetics/mod.rs new file mode 100644 index 000000000000..1d520e9ad644 --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/mod.rs @@ -0,0 +1,581 @@ +//! Defines basic arithmetic kernels for [`PrimitiveArray`](crate::array::PrimitiveArray)s. +//! +//! The Arithmetics module is composed by basic arithmetics operations that can +//! be performed on [`PrimitiveArray`](crate::array::PrimitiveArray). +//! +//! Whenever possible, each operation declares variations +//! of the basic operation that offers different guarantees: +//! * plain: panics on overflowing and underflowing. +//! * checked: turns an overflowing to a null. +//! * saturating: turns the overflowing to the MAX or MIN value respectively. +//! * overflowing: returns an extra [`Bitmap`] denoting whether the operation overflowed. +//! * adaptive: for [`Decimal`](crate::datatypes::DataType::Decimal) only, +//! adjusts the precision and scale to make the resulting value fit. +#[forbid(unsafe_code)] +pub mod basic; +#[cfg(feature = "compute_arithmetics_decimal")] +pub mod decimal; +pub mod time; + +use crate::array::{Array, DictionaryArray, PrimitiveArray}; +use crate::bitmap::Bitmap; +use crate::datatypes::{DataType, IntervalUnit, TimeUnit}; +use crate::scalar::{PrimitiveScalar, Scalar}; +use crate::types::NativeType; + +fn binary_dyn, &PrimitiveArray) -> PrimitiveArray>( + lhs: &dyn Array, + rhs: &dyn Array, + op: F, +) -> Box { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + op(lhs, rhs).boxed() +} + +// Macro to create a `match` statement with dynamic dispatch to functions based on +// the array's logical types +macro_rules! arith { + ($lhs:expr, $rhs:expr, $op:tt $(, decimal = $op_decimal:tt )? $(, duration = $op_duration:tt )? $(, interval = $op_interval:tt )? $(, timestamp = $op_timestamp:tt )?) => {{ + let lhs = $lhs; + let rhs = $rhs; + use DataType::*; + match (lhs.data_type(), rhs.data_type()) { + (Int8, Int8) => binary_dyn::(lhs, rhs, basic::$op), + (Int16, Int16) => binary_dyn::(lhs, rhs, basic::$op), + (Int32, Int32) => binary_dyn::(lhs, rhs, basic::$op), + (Int64, Int64) | (Duration(_), Duration(_)) => { + binary_dyn::(lhs, rhs, basic::$op) + } + (UInt8, UInt8) => binary_dyn::(lhs, rhs, basic::$op), + (UInt16, UInt16) => binary_dyn::(lhs, rhs, basic::$op), + (UInt32, UInt32) => binary_dyn::(lhs, rhs, basic::$op), + (UInt64, UInt64) => binary_dyn::(lhs, rhs, basic::$op), + (Float32, Float32) => binary_dyn::(lhs, rhs, basic::$op), + (Float64, Float64) => binary_dyn::(lhs, rhs, basic::$op), + $ ( + (Decimal(_, _), Decimal(_, _)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + Box::new(decimal::$op_decimal(lhs, rhs)) as Box + } + )? 
+ $ ( + (Time32(TimeUnit::Second), Duration(_)) + | (Time32(TimeUnit::Millisecond), Duration(_)) + | (Date32, Duration(_)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + Box::new(time::$op_duration::(lhs, rhs)) as Box + } + (Time64(TimeUnit::Microsecond), Duration(_)) + | (Time64(TimeUnit::Nanosecond), Duration(_)) + | (Date64, Duration(_)) + | (Timestamp(_, _), Duration(_)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + Box::new(time::$op_duration::(lhs, rhs)) as Box + } + )? + $ ( + (Timestamp(_, _), Interval(IntervalUnit::MonthDayNano)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_interval(lhs, rhs).map(|x| Box::new(x) as Box).unwrap() + } + )? + $ ( + (Timestamp(_, None), Timestamp(_, None)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_timestamp(lhs, rhs).map(|x| Box::new(x) as Box).unwrap() + } + )? + _ => todo!( + "Addition of {:?} with {:?} is not supported", + lhs.data_type(), + rhs.data_type() + ), + } + }}; +} + +fn binary_scalar, &T) -> PrimitiveArray>( + lhs: &PrimitiveArray, + rhs: &PrimitiveScalar, + op: F, +) -> PrimitiveArray { + let rhs = if let Some(rhs) = *rhs.value() { + rhs + } else { + return PrimitiveArray::::new_null(lhs.data_type().clone(), lhs.len()); + }; + op(lhs, &rhs) +} + +fn binary_scalar_dyn, &T) -> PrimitiveArray>( + lhs: &dyn Array, + rhs: &dyn Scalar, + op: F, +) -> Box { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + binary_scalar(lhs, rhs, op).boxed() +} + +// Macro to create a `match` statement with dynamic dispatch to functions based on +// the array's logical types +macro_rules! arith_scalar { + ($lhs:expr, $rhs:expr, $op:tt $(, decimal = $op_decimal:tt )? $(, duration = $op_duration:tt )? $(, interval = $op_interval:tt )? $(, timestamp = $op_timestamp:tt )?) => {{ + let lhs = $lhs; + let rhs = $rhs; + use DataType::*; + match (lhs.data_type(), rhs.data_type()) { + (Int8, Int8) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (Int16, Int16) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (Int32, Int32) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (Int64, Int64) | (Duration(_), Duration(_)) => { + binary_scalar_dyn::(lhs, rhs, basic::$op) + } + (UInt8, UInt8) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (UInt16, UInt16) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (UInt32, UInt32) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (UInt64, UInt64) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (Float32, Float32) => binary_scalar_dyn::(lhs, rhs, basic::$op), + (Float64, Float64) => binary_scalar_dyn::(lhs, rhs, basic::$op), + $ ( + (Decimal(_, _), Decimal(_, _)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + decimal::$op_decimal(lhs, rhs).boxed() + } + )? 
+ $ ( + (Time32(TimeUnit::Second), Duration(_)) + | (Time32(TimeUnit::Millisecond), Duration(_)) + | (Date32, Duration(_)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_duration::(lhs, rhs).boxed() + } + (Time64(TimeUnit::Microsecond), Duration(_)) + | (Time64(TimeUnit::Nanosecond), Duration(_)) + | (Date64, Duration(_)) + | (Timestamp(_, _), Duration(_)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_duration::(lhs, rhs).boxed() + } + )? + $ ( + (Timestamp(_, _), Interval(IntervalUnit::MonthDayNano)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_interval(lhs, rhs).unwrap().boxed() + } + )? + $ ( + (Timestamp(_, None), Timestamp(_, None)) => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + time::$op_timestamp(lhs, rhs).unwrap().boxed() + } + )? + _ => todo!( + "Addition of {:?} with {:?} is not supported", + lhs.data_type(), + rhs.data_type() + ), + } + }}; +} + +/// Adds two [`Array`]s. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_add`] to check) +/// * the arrays have a different length +/// * one of the arrays is a timestamp with timezone and the timezone is not valid. +pub fn add(lhs: &dyn Array, rhs: &dyn Array) -> Box { + arith!( + lhs, + rhs, + add, + duration = add_duration, + interval = add_interval + ) +} + +/// Adds an [`Array`] and a [`Scalar`]. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_add`] to check) +/// * the arrays have a different length +/// * one of the arrays is a timestamp with timezone and the timezone is not valid. +pub fn add_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> Box { + arith_scalar!( + lhs, + rhs, + add_scalar, + duration = add_duration_scalar, + interval = add_interval_scalar + ) +} + +/// Returns whether two [`DataType`]s can be added by [`add`]. +pub fn can_add(lhs: &DataType, rhs: &DataType) -> bool { + use DataType::*; + matches!( + (lhs, rhs), + (Int8, Int8) + | (Int16, Int16) + | (Int32, Int32) + | (Int64, Int64) + | (UInt8, UInt8) + | (UInt16, UInt16) + | (UInt32, UInt32) + | (UInt64, UInt64) + | (Float64, Float64) + | (Float32, Float32) + | (Duration(_), Duration(_)) + | (Decimal(_, _), Decimal(_, _)) + | (Date32, Duration(_)) + | (Date64, Duration(_)) + | (Time32(TimeUnit::Millisecond), Duration(_)) + | (Time32(TimeUnit::Second), Duration(_)) + | (Time64(TimeUnit::Microsecond), Duration(_)) + | (Time64(TimeUnit::Nanosecond), Duration(_)) + | (Timestamp(_, _), Duration(_)) + | (Timestamp(_, _), Interval(IntervalUnit::MonthDayNano)) + ) +} + +/// Subtracts two [`Array`]s. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_sub`] to check) +/// * the arrays have a different length +/// * one of the arrays is a timestamp with timezone and the timezone is not valid. +pub fn sub(lhs: &dyn Array, rhs: &dyn Array) -> Box { + arith!( + lhs, + rhs, + sub, + decimal = sub, + duration = subtract_duration, + timestamp = subtract_timestamps + ) +} + +/// Adds an [`Array`] and a [`Scalar`]. 
+/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_sub`] to check) +/// * the arrays have a different length +/// * one of the arrays is a timestamp with timezone and the timezone is not valid. +pub fn sub_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> Box { + arith_scalar!( + lhs, + rhs, + sub_scalar, + duration = sub_duration_scalar, + timestamp = sub_timestamps_scalar + ) +} + +/// Returns whether two [`DataType`]s can be subtracted by [`sub`]. +pub fn can_sub(lhs: &DataType, rhs: &DataType) -> bool { + use DataType::*; + matches!( + (lhs, rhs), + (Int8, Int8) + | (Int16, Int16) + | (Int32, Int32) + | (Int64, Int64) + | (UInt8, UInt8) + | (UInt16, UInt16) + | (UInt32, UInt32) + | (UInt64, UInt64) + | (Float64, Float64) + | (Float32, Float32) + | (Duration(_), Duration(_)) + | (Decimal(_, _), Decimal(_, _)) + | (Date32, Duration(_)) + | (Date64, Duration(_)) + | (Time32(TimeUnit::Millisecond), Duration(_)) + | (Time32(TimeUnit::Second), Duration(_)) + | (Time64(TimeUnit::Microsecond), Duration(_)) + | (Time64(TimeUnit::Nanosecond), Duration(_)) + | (Timestamp(_, _), Duration(_)) + | (Timestamp(_, None), Timestamp(_, None)) + ) +} + +/// Multiply two [`Array`]s. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_mul`] to check) +/// * the arrays have a different length +pub fn mul(lhs: &dyn Array, rhs: &dyn Array) -> Box { + arith!(lhs, rhs, mul, decimal = mul) +} + +/// Multiply an [`Array`] with a [`Scalar`]. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_mul`] to check) +pub fn mul_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> Box { + arith_scalar!(lhs, rhs, mul_scalar, decimal = mul_scalar) +} + +/// Returns whether two [`DataType`]s can be multiplied by [`mul`]. +pub fn can_mul(lhs: &DataType, rhs: &DataType) -> bool { + use DataType::*; + matches!( + (lhs, rhs), + (Int8, Int8) + | (Int16, Int16) + | (Int32, Int32) + | (Int64, Int64) + | (UInt8, UInt8) + | (UInt16, UInt16) + | (UInt32, UInt32) + | (UInt64, UInt64) + | (Float64, Float64) + | (Float32, Float32) + | (Decimal(_, _), Decimal(_, _)) + ) +} + +/// Divide of two [`Array`]s. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_div`] to check) +/// * the arrays have a different length +pub fn div(lhs: &dyn Array, rhs: &dyn Array) -> Box { + arith!(lhs, rhs, div, decimal = div) +} + +/// Divide an [`Array`] with a [`Scalar`]. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_div`] to check) +pub fn div_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> Box { + arith_scalar!(lhs, rhs, div_scalar, decimal = div_scalar) +} + +/// Returns whether two [`DataType`]s can be divided by [`div`]. +pub fn can_div(lhs: &DataType, rhs: &DataType) -> bool { + can_mul(lhs, rhs) +} + +/// Remainder of two [`Array`]s. +/// # Panic +/// This function panics iff +/// * the operation is not supported for the logical types (use [`can_rem`] to check) +/// * the arrays have a different length +pub fn rem(lhs: &dyn Array, rhs: &dyn Array) -> Box { + arith!(lhs, rhs, rem) +} + +/// Returns whether two [`DataType`]s "can be remainder" by [`rem`]. 
+pub fn can_rem(lhs: &DataType, rhs: &DataType) -> bool { + use DataType::*; + matches!( + (lhs, rhs), + (Int8, Int8) + | (Int16, Int16) + | (Int32, Int32) + | (Int64, Int64) + | (UInt8, UInt8) + | (UInt16, UInt16) + | (UInt32, UInt32) + | (UInt64, UInt64) + | (Float64, Float64) + | (Float32, Float32) + ) +} + +macro_rules! with_match_negatable {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + use crate::types::{days_ms, months_days_ns, i256}; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + Int256 => __with_ty__! { i256 }, + DaysMs => __with_ty__! { days_ms }, + MonthDayNano => __with_ty__! { months_days_ns }, + UInt8 | UInt16 | UInt32 | UInt64 | Float16 => todo!(), + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + } +})} + +/// Negates an [`Array`]. +/// # Panic +/// This function panics iff either +/// * the operation is not supported for the logical type (use [`can_neg`] to check) +/// * the operation overflows +pub fn neg(array: &dyn Array) -> Box { + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Primitive(primitive) => with_match_negatable!(primitive, |$T| { + let array = array.as_any().downcast_ref().unwrap(); + + let result = basic::negate::<$T>(array); + Box::new(result) as Box + }), + Dictionary(key) => match_integer_type!(key, |$T| { + let array = array.as_any().downcast_ref::>().unwrap(); + + let values = neg(array.values().as_ref()); + + // safety - this operation only applies to values and thus preserves the dictionary's invariant + unsafe{ + DictionaryArray::<$T>::try_new_unchecked(array.data_type().clone(), array.keys().clone(), values).unwrap().boxed() + } + }), + _ => todo!(), + } +} + +/// Whether [`neg`] is supported for a given [`DataType`] +pub fn can_neg(data_type: &DataType) -> bool { + if let DataType::Dictionary(_, values, _) = data_type.to_logical_type() { + return can_neg(values.as_ref()); + } + + use crate::datatypes::PhysicalType::*; + use crate::datatypes::PrimitiveType::*; + matches!( + data_type.to_physical_type(), + Primitive(Int8) + | Primitive(Int16) + | Primitive(Int32) + | Primitive(Int64) + | Primitive(Float64) + | Primitive(Float32) + | Primitive(DaysMs) + | Primitive(MonthDayNano) + ) +} + +/// Defines basic addition operation for primitive arrays +pub trait ArrayAdd: Sized { + /// Adds itself to `rhs` + fn add(&self, rhs: &Rhs) -> Self; +} + +/// Defines wrapping addition operation for primitive arrays +pub trait ArrayWrappingAdd: Sized { + /// Adds itself to `rhs` using wrapping addition + fn wrapping_add(&self, rhs: &Rhs) -> Self; +} + +/// Defines checked addition operation for primitive arrays +pub trait ArrayCheckedAdd: Sized { + /// Checked add + fn checked_add(&self, rhs: &Rhs) -> Self; +} + +/// Defines saturating addition operation for primitive arrays +pub trait ArraySaturatingAdd: Sized { + /// Saturating add + fn saturating_add(&self, rhs: &Rhs) -> Self; +} + +/// Defines Overflowing addition operation for primitive arrays +pub trait ArrayOverflowingAdd: Sized { + /// Overflowing add + fn overflowing_add(&self, rhs: &Rhs) -> (Self, Bitmap); +} + +/// Defines basic subtraction operation for primitive arrays +pub trait ArraySub: Sized { + /// subtraction + fn sub(&self, rhs: &Rhs) -> Self; +} + +/// Defines wrapping 
subtraction operation for primitive arrays +pub trait ArrayWrappingSub: Sized { + /// wrapping subtraction + fn wrapping_sub(&self, rhs: &Rhs) -> Self; +} + +/// Defines checked subtraction operation for primitive arrays +pub trait ArrayCheckedSub: Sized { + /// checked subtraction + fn checked_sub(&self, rhs: &Rhs) -> Self; +} + +/// Defines saturating subtraction operation for primitive arrays +pub trait ArraySaturatingSub: Sized { + /// saturarting subtraction + fn saturating_sub(&self, rhs: &Rhs) -> Self; +} + +/// Defines Overflowing subtraction operation for primitive arrays +pub trait ArrayOverflowingSub: Sized { + /// overflowing subtraction + fn overflowing_sub(&self, rhs: &Rhs) -> (Self, Bitmap); +} + +/// Defines basic multiplication operation for primitive arrays +pub trait ArrayMul: Sized { + /// multiplication + fn mul(&self, rhs: &Rhs) -> Self; +} + +/// Defines wrapping multiplication operation for primitive arrays +pub trait ArrayWrappingMul: Sized { + /// wrapping multiplication + fn wrapping_mul(&self, rhs: &Rhs) -> Self; +} + +/// Defines checked multiplication operation for primitive arrays +pub trait ArrayCheckedMul: Sized { + /// checked multiplication + fn checked_mul(&self, rhs: &Rhs) -> Self; +} + +/// Defines saturating multiplication operation for primitive arrays +pub trait ArraySaturatingMul: Sized { + /// saturating multiplication + fn saturating_mul(&self, rhs: &Rhs) -> Self; +} + +/// Defines Overflowing multiplication operation for primitive arrays +pub trait ArrayOverflowingMul: Sized { + /// overflowing multiplication + fn overflowing_mul(&self, rhs: &Rhs) -> (Self, Bitmap); +} + +/// Defines basic division operation for primitive arrays +pub trait ArrayDiv: Sized { + /// division + fn div(&self, rhs: &Rhs) -> Self; +} + +/// Defines checked division operation for primitive arrays +pub trait ArrayCheckedDiv: Sized { + /// checked division + fn checked_div(&self, rhs: &Rhs) -> Self; +} + +/// Defines basic reminder operation for primitive arrays +pub trait ArrayRem: Sized { + /// remainder + fn rem(&self, rhs: &Rhs) -> Self; +} + +/// Defines checked reminder operation for primitive arrays +pub trait ArrayCheckedRem: Sized { + /// checked remainder + fn checked_rem(&self, rhs: &Rhs) -> Self; +} diff --git a/crates/nano-arrow/src/compute/arithmetics/time.rs b/crates/nano-arrow/src/compute/arithmetics/time.rs new file mode 100644 index 000000000000..aa2e25e3ab0f --- /dev/null +++ b/crates/nano-arrow/src/compute/arithmetics/time.rs @@ -0,0 +1,432 @@ +//! Defines the arithmetic kernels for adding a Duration to a Timestamp, +//! Time32, Time64, Date32 and Date64. +//! +//! For the purposes of Arrow Implementations, adding this value to a Timestamp +//! ("t1") naively (i.e. simply summing the two number) is acceptable even +//! though in some cases the resulting Timestamp (t2) would not account for +//! leap-seconds during the elapsed time between "t1" and "t2". Similarly, +//! representing the difference between two Unix timestamp is acceptable, but +//! would yield a value that is possibly a few seconds off from the true +//! elapsed time. 
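The kernels in this module implement the naive arithmetic described in the module docs above by rescaling the duration to the unit of the time array and then performing a plain integer sum. A minimal standalone sketch of that idea (illustrative only, not part of the patch; the helper name `add_naive` and the chosen units are assumptions):

```rust
// Sketch: rescale a millisecond duration to a second-based timestamp, then
// add the two integers naively (no leap-second handling), mirroring the
// `a + (b as f64 * scale)` closure used by the kernels below.
fn add_naive(timestamp_s: i64, duration_ms: i64) -> i64 {
    let scale = 1e-3_f64; // milliseconds -> seconds
    timestamp_s + (duration_ms as f64 * scale) as i64
}

fn main() {
    // 100_000 s since the epoch plus a 10_000 ms (10 s) duration.
    assert_eq!(add_naive(100_000, 10_000), 100_010);
}
```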
+ +use std::ops::{Add, Sub}; + +use num_traits::AsPrimitive; + +use crate::array::PrimitiveArray; +use crate::compute::arity::{binary, unary}; +use crate::datatypes::{DataType, TimeUnit}; +use crate::error::{Error, Result}; +use crate::scalar::{PrimitiveScalar, Scalar}; +use crate::temporal_conversions; +use crate::types::{months_days_ns, NativeType}; + +/// Creates the scale required to add or subtract a Duration to a time array +/// (Timestamp, Time, or Date). The resulting scale always multiplies the rhs +/// number (Duration) so it can be added to the lhs number (time array). +fn create_scale(lhs: &DataType, rhs: &DataType) -> Result { + // Matching on both data types from both numbers to calculate the correct + // scale for the operation. The timestamp, Time and duration have a + // Timeunit enum in its data type. This enum is used to describe the + // addition of the duration. The Date32 and Date64 have different rules for + // the scaling. + let scale = match (lhs, rhs) { + (DataType::Timestamp(timeunit_a, _), DataType::Duration(timeunit_b)) + | (DataType::Time32(timeunit_a), DataType::Duration(timeunit_b)) + | (DataType::Time64(timeunit_a), DataType::Duration(timeunit_b)) => { + // The scale is based on the TimeUnit that each of the numbers have. + temporal_conversions::timeunit_scale(*timeunit_a, *timeunit_b) + }, + (DataType::Date32, DataType::Duration(timeunit)) => { + // Date32 represents the time elapsed time since UNIX epoch + // (1970-01-01) in days (32 bits). The duration value has to be + // scaled to days to be able to add the value to the Date. + temporal_conversions::timeunit_scale(TimeUnit::Second, *timeunit) + / temporal_conversions::SECONDS_IN_DAY as f64 + }, + (DataType::Date64, DataType::Duration(timeunit)) => { + // Date64 represents the time elapsed time since UNIX epoch + // (1970-01-01) in milliseconds (64 bits). The duration value has + // to be scaled to milliseconds to be able to add the value to the + // Date. + temporal_conversions::timeunit_scale(TimeUnit::Millisecond, *timeunit) + }, + _ => { + return Err(Error::InvalidArgumentError( + "Incorrect data type for the arguments".to_string(), + )); + }, + }; + + Ok(scale) +} + +/// Adds a duration to a time array (Timestamp, Time and Date). The timeunit +/// enum is used to scale correctly both arrays; adding seconds with seconds, +/// or milliseconds with milliseconds. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::time::add_duration; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::{DataType, TimeUnit}; +/// +/// let timestamp = PrimitiveArray::from([ +/// Some(100000i64), +/// Some(200000i64), +/// None, +/// Some(300000i64), +/// ]) +/// .to(DataType::Timestamp( +/// TimeUnit::Second, +/// Some("America/New_York".to_string()), +/// )); +/// +/// let duration = PrimitiveArray::from([Some(10i64), Some(20i64), None, Some(30i64)]) +/// .to(DataType::Duration(TimeUnit::Second)); +/// +/// let result = add_duration(×tamp, &duration); +/// let expected = PrimitiveArray::from([ +/// Some(100010i64), +/// Some(200020i64), +/// None, +/// Some(300030i64), +/// ]) +/// .to(DataType::Timestamp( +/// TimeUnit::Second, +/// Some("America/New_York".to_string()), +/// )); +/// +/// assert_eq!(result, expected); +/// ``` +pub fn add_duration( + time: &PrimitiveArray, + duration: &PrimitiveArray, +) -> PrimitiveArray +where + f64: AsPrimitive, + T: NativeType + Add, +{ + let scale = create_scale(time.data_type(), duration.data_type()).unwrap(); + + // Closure for the binary operation. The closure contains the scale + // required to add a duration to the timestamp array. + let op = move |a: T, b: i64| a + (b as f64 * scale).as_(); + + binary(time, duration, time.data_type().clone(), op) +} + +/// Adds a duration to a time array (Timestamp, Time and Date). The timeunit +/// enum is used to scale correctly both arrays; adding seconds with seconds, +/// or milliseconds with milliseconds. +pub fn add_duration_scalar( + time: &PrimitiveArray, + duration: &PrimitiveScalar, +) -> PrimitiveArray +where + f64: AsPrimitive, + T: NativeType + Add, +{ + let scale = create_scale(time.data_type(), duration.data_type()).unwrap(); + let duration = if let Some(duration) = *duration.value() { + duration + } else { + return PrimitiveArray::::new_null(time.data_type().clone(), time.len()); + }; + + // Closure for the binary operation. The closure contains the scale + // required to add a duration to the timestamp array. + let op = move |a: T| a + (duration as f64 * scale).as_(); + + unary(time, op, time.data_type().clone()) +} + +/// Subtract a duration to a time array (Timestamp, Time and Date). The timeunit +/// enum is used to scale correctly both arrays; adding seconds with seconds, +/// or milliseconds with milliseconds. 
+/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::time::subtract_duration; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::{DataType, TimeUnit}; +/// +/// let timestamp = PrimitiveArray::from([ +/// Some(100000i64), +/// Some(200000i64), +/// None, +/// Some(300000i64), +/// ]) +/// .to(DataType::Timestamp( +/// TimeUnit::Second, +/// Some("America/New_York".to_string()), +/// )); +/// +/// let duration = PrimitiveArray::from([Some(10i64), Some(20i64), None, Some(30i64)]) +/// .to(DataType::Duration(TimeUnit::Second)); +/// +/// let result = subtract_duration(×tamp, &duration); +/// let expected = PrimitiveArray::from([ +/// Some(99990i64), +/// Some(199980i64), +/// None, +/// Some(299970i64), +/// ]) +/// .to(DataType::Timestamp( +/// TimeUnit::Second, +/// Some("America/New_York".to_string()), +/// )); +/// +/// assert_eq!(result, expected); +/// +/// ``` +pub fn subtract_duration( + time: &PrimitiveArray, + duration: &PrimitiveArray, +) -> PrimitiveArray +where + f64: AsPrimitive, + T: NativeType + Sub, +{ + let scale = create_scale(time.data_type(), duration.data_type()).unwrap(); + + // Closure for the binary operation. The closure contains the scale + // required to add a duration to the timestamp array. + let op = move |a: T, b: i64| a - (b as f64 * scale).as_(); + + binary(time, duration, time.data_type().clone(), op) +} + +/// Subtract a duration to a time array (Timestamp, Time and Date). The timeunit +/// enum is used to scale correctly both arrays; adding seconds with seconds, +/// or milliseconds with milliseconds. +pub fn sub_duration_scalar( + time: &PrimitiveArray, + duration: &PrimitiveScalar, +) -> PrimitiveArray +where + f64: AsPrimitive, + T: NativeType + Sub, +{ + let scale = create_scale(time.data_type(), duration.data_type()).unwrap(); + let duration = if let Some(duration) = *duration.value() { + duration + } else { + return PrimitiveArray::::new_null(time.data_type().clone(), time.len()); + }; + + let op = move |a: T| a - (duration as f64 * scale).as_(); + + unary(time, op, time.data_type().clone()) +} + +/// Calculates the difference between two timestamps returning an array of type +/// Duration. The timeunit enum is used to scale correctly both arrays; +/// subtracting seconds with seconds, or milliseconds with milliseconds. +/// +/// # Examples +/// ``` +/// use arrow2::compute::arithmetics::time::subtract_timestamps; +/// use arrow2::array::PrimitiveArray; +/// use arrow2::datatypes::{DataType, TimeUnit}; +/// let timestamp_a = PrimitiveArray::from([ +/// Some(100_010i64), +/// Some(200_020i64), +/// None, +/// Some(300_030i64), +/// ]) +/// .to(DataType::Timestamp(TimeUnit::Second, None)); +/// +/// let timestamp_b = PrimitiveArray::from([ +/// Some(100_000i64), +/// Some(200_000i64), +/// None, +/// Some(300_000i64), +/// ]) +/// .to(DataType::Timestamp(TimeUnit::Second, None)); +/// +/// let expected = PrimitiveArray::from([Some(10i64), Some(20i64), None, Some(30i64)]) +/// .to(DataType::Duration(TimeUnit::Second)); +/// +/// let result = subtract_timestamps(×tamp_a, &×tamp_b).unwrap(); +/// assert_eq!(result, expected); +/// ``` +pub fn subtract_timestamps( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, +) -> Result> { + // Matching on both data types from both arrays. + // Both timestamps have a Timeunit enum in its data type. + // This enum is used to adjust the scale between the timestamps. + match (lhs.data_type(), rhs.data_type()) { + // Naive timestamp comparison. 
It doesn't take into account timezones + // from the Timestamp timeunit. + (DataType::Timestamp(timeunit_a, None), DataType::Timestamp(timeunit_b, None)) => { + // Closure for the binary operation. The closure contains the scale + // required to calculate the difference between the timestamps. + let scale = temporal_conversions::timeunit_scale(*timeunit_a, *timeunit_b); + let op = move |a, b| a - (b as f64 * scale) as i64; + + Ok(binary(lhs, rhs, DataType::Duration(*timeunit_a), op)) + }, + _ => Err(Error::InvalidArgumentError( + "Incorrect data type for the arguments".to_string(), + )), + } +} + +/// Calculates the difference between two timestamps as [`DataType::Duration`] with the same time scale. +pub fn sub_timestamps_scalar( + lhs: &PrimitiveArray, + rhs: &PrimitiveScalar, +) -> Result> { + let (scale, timeunit_a) = + if let (DataType::Timestamp(timeunit_a, None), DataType::Timestamp(timeunit_b, None)) = + (lhs.data_type(), rhs.data_type()) + { + ( + temporal_conversions::timeunit_scale(*timeunit_a, *timeunit_b), + timeunit_a, + ) + } else { + return Err(Error::InvalidArgumentError( + "sub_timestamps_scalar requires both arguments to be timestamps without timezone" + .to_string(), + )); + }; + + let rhs = if let Some(value) = *rhs.value() { + value + } else { + return Ok(PrimitiveArray::::new_null( + lhs.data_type().clone(), + lhs.len(), + )); + }; + + let op = move |a| a - (rhs as f64 * scale) as i64; + + Ok(unary(lhs, op, DataType::Duration(*timeunit_a))) +} + +/// Adds an interval to a [`DataType::Timestamp`]. +pub fn add_interval( + timestamp: &PrimitiveArray, + interval: &PrimitiveArray, +) -> Result> { + match timestamp.data_type().to_logical_type() { + DataType::Timestamp(time_unit, Some(timezone_str)) => { + let time_unit = *time_unit; + let timezone = temporal_conversions::parse_offset(timezone_str); + match timezone { + Ok(timezone) => Ok(binary( + timestamp, + interval, + timestamp.data_type().clone(), + |timestamp, interval| { + temporal_conversions::add_interval( + timestamp, time_unit, interval, &timezone, + ) + }, + )), + #[cfg(feature = "chrono-tz")] + Err(_) => { + let timezone = temporal_conversions::parse_offset_tz(timezone_str)?; + Ok(binary( + timestamp, + interval, + timestamp.data_type().clone(), + |timestamp, interval| { + temporal_conversions::add_interval( + timestamp, time_unit, interval, &timezone, + ) + }, + )) + }, + #[cfg(not(feature = "chrono-tz"))] + _ => Err(Error::InvalidArgumentError(format!( + "timezone \"{}\" cannot be parsed (feature chrono-tz is not active)", + timezone_str + ))), + } + }, + DataType::Timestamp(time_unit, None) => { + let time_unit = *time_unit; + Ok(binary( + timestamp, + interval, + timestamp.data_type().clone(), + |timestamp, interval| { + temporal_conversions::add_naive_interval(timestamp, time_unit, interval) + }, + )) + }, + _ => Err(Error::InvalidArgumentError( + "Adding an interval is only supported for `DataType::Timestamp`".to_string(), + )), + } +} + +/// Adds an interval to a [`DataType::Timestamp`]. 
+pub fn add_interval_scalar( + timestamp: &PrimitiveArray, + interval: &PrimitiveScalar, +) -> Result> { + let interval = if let Some(interval) = *interval.value() { + interval + } else { + return Ok(PrimitiveArray::::new_null( + timestamp.data_type().clone(), + timestamp.len(), + )); + }; + + match timestamp.data_type().to_logical_type() { + DataType::Timestamp(time_unit, Some(timezone_str)) => { + let time_unit = *time_unit; + let timezone = temporal_conversions::parse_offset(timezone_str); + match timezone { + Ok(timezone) => Ok(unary( + timestamp, + |timestamp| { + temporal_conversions::add_interval( + timestamp, time_unit, interval, &timezone, + ) + }, + timestamp.data_type().clone(), + )), + #[cfg(feature = "chrono-tz")] + Err(_) => { + let timezone = temporal_conversions::parse_offset_tz(timezone_str)?; + Ok(unary( + timestamp, + |timestamp| { + temporal_conversions::add_interval( + timestamp, time_unit, interval, &timezone, + ) + }, + timestamp.data_type().clone(), + )) + }, + #[cfg(not(feature = "chrono-tz"))] + _ => Err(Error::InvalidArgumentError(format!( + "timezone \"{}\" cannot be parsed (feature chrono-tz is not active)", + timezone_str + ))), + } + }, + DataType::Timestamp(time_unit, None) => { + let time_unit = *time_unit; + Ok(unary( + timestamp, + |timestamp| { + temporal_conversions::add_naive_interval(timestamp, time_unit, interval) + }, + timestamp.data_type().clone(), + )) + }, + _ => Err(Error::InvalidArgumentError( + "Adding an interval is only supported for `DataType::Timestamp`".to_string(), + )), + } +} diff --git a/crates/nano-arrow/src/compute/arity.rs b/crates/nano-arrow/src/compute/arity.rs new file mode 100644 index 000000000000..935970ccdf75 --- /dev/null +++ b/crates/nano-arrow/src/compute/arity.rs @@ -0,0 +1,279 @@ +//! Defines kernels suitable to perform operations to primitive arrays. + +use super::utils::{check_same_len, combine_validities}; +use crate::array::PrimitiveArray; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::NativeType; + +/// Applies an unary and infallible function to a [`PrimitiveArray`]. This is the +/// fastest way to perform an operation on a [`PrimitiveArray`] when the benefits +/// of a vectorized operation outweighs the cost of branching nulls and +/// non-nulls. +/// +/// # Implementation +/// This will apply the function for all values, including those on null slots. +/// This implies that the operation must be infallible for any value of the +/// corresponding type or this function may panic. +#[inline] +pub fn unary(array: &PrimitiveArray, op: F, data_type: DataType) -> PrimitiveArray +where + I: NativeType, + O: NativeType, + F: Fn(I) -> O, +{ + let values = array.values().iter().map(|v| op(*v)).collect::>(); + + PrimitiveArray::::new(data_type, values.into(), array.validity().cloned()) +} + +/// Version of unary that checks for errors in the closure used to create the +/// buffer +pub fn try_unary( + array: &PrimitiveArray, + op: F, + data_type: DataType, +) -> Result> +where + I: NativeType, + O: NativeType, + F: Fn(I) -> Result, +{ + let values = array + .values() + .iter() + .map(|v| op(*v)) + .collect::>>()? + .into(); + + Ok(PrimitiveArray::::new( + data_type, + values, + array.validity().cloned(), + )) +} + +/// Version of unary that returns an array and bitmap. 
Used when working with +/// overflowing operations +pub fn unary_with_bitmap( + array: &PrimitiveArray, + op: F, + data_type: DataType, +) -> (PrimitiveArray, Bitmap) +where + I: NativeType, + O: NativeType, + F: Fn(I) -> (O, bool), +{ + let mut mut_bitmap = MutableBitmap::with_capacity(array.len()); + + let values = array + .values() + .iter() + .map(|v| { + let (res, over) = op(*v); + mut_bitmap.push(over); + res + }) + .collect::>() + .into(); + + ( + PrimitiveArray::::new(data_type, values, array.validity().cloned()), + mut_bitmap.into(), + ) +} + +/// Version of unary that creates a mutable bitmap that is used to keep track +/// of checked operations. The resulting bitmap is compared with the array +/// bitmap to create the final validity array. +pub fn unary_checked( + array: &PrimitiveArray, + op: F, + data_type: DataType, +) -> PrimitiveArray +where + I: NativeType, + O: NativeType, + F: Fn(I) -> Option, +{ + let mut mut_bitmap = MutableBitmap::with_capacity(array.len()); + + let values = array + .values() + .iter() + .map(|v| match op(*v) { + Some(val) => { + mut_bitmap.push(true); + val + }, + None => { + mut_bitmap.push(false); + O::default() + }, + }) + .collect::>() + .into(); + + // The validity has to be checked against the bitmap created during the + // creation of the values with the iterator. If an error was found during + // the iteration, then the validity is changed to None to mark the value + // as Null + let bitmap: Bitmap = mut_bitmap.into(); + let validity = combine_validities(array.validity(), Some(&bitmap)); + + PrimitiveArray::::new(data_type, values, validity) +} + +/// Applies a binary operations to two primitive arrays. This is the fastest +/// way to perform an operation on two primitive array when the benefits of a +/// vectorized operation outweighs the cost of branching nulls and non-nulls. +/// # Errors +/// This function errors iff the arrays have a different length. +/// # Implementation +/// This will apply the function for all values, including those on null slots. +/// This implies that the operation must be infallible for any value of the +/// corresponding type. +/// The types of the arrays are not checked with this operation. The closure +/// "op" needs to handle the different types in the arrays. The datatype for the +/// resulting array has to be selected by the implementer of the function as +/// an argument for the function. +#[inline] +pub fn binary( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, + data_type: DataType, + op: F, +) -> PrimitiveArray +where + T: NativeType, + D: NativeType, + F: Fn(T, D) -> T, +{ + check_same_len(lhs, rhs).unwrap(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| op(*l, *r)) + .collect::>() + .into(); + + PrimitiveArray::::new(data_type, values, validity) +} + +/// Version of binary that checks for errors in the closure used to create the +/// buffer +pub fn try_binary( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, + data_type: DataType, + op: F, +) -> Result> +where + T: NativeType, + D: NativeType, + F: Fn(T, D) -> Result, +{ + check_same_len(lhs, rhs)?; + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| op(*l, *r)) + .collect::>>()? + .into(); + + Ok(PrimitiveArray::::new(data_type, values, validity)) +} + +/// Version of binary that returns an array and bitmap. 
Used when working with +/// overflowing operations +pub fn binary_with_bitmap( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, + data_type: DataType, + op: F, +) -> (PrimitiveArray, Bitmap) +where + T: NativeType, + D: NativeType, + F: Fn(T, D) -> (T, bool), +{ + check_same_len(lhs, rhs).unwrap(); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let mut mut_bitmap = MutableBitmap::with_capacity(lhs.len()); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| { + let (res, over) = op(*l, *r); + mut_bitmap.push(over); + res + }) + .collect::>() + .into(); + + ( + PrimitiveArray::::new(data_type, values, validity), + mut_bitmap.into(), + ) +} + +/// Version of binary that creates a mutable bitmap that is used to keep track +/// of checked operations. The resulting bitmap is compared with the array +/// bitmap to create the final validity array. +pub fn binary_checked( + lhs: &PrimitiveArray, + rhs: &PrimitiveArray, + data_type: DataType, + op: F, +) -> PrimitiveArray +where + T: NativeType, + D: NativeType, + F: Fn(T, D) -> Option, +{ + check_same_len(lhs, rhs).unwrap(); + + let mut mut_bitmap = MutableBitmap::with_capacity(lhs.len()); + + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| match op(*l, *r) { + Some(val) => { + mut_bitmap.push(true); + val + }, + None => { + mut_bitmap.push(false); + T::default() + }, + }) + .collect::>() + .into(); + + let bitmap: Bitmap = mut_bitmap.into(); + let validity = combine_validities(lhs.validity(), rhs.validity()); + + // The validity has to be checked against the bitmap created during the + // creation of the values with the iterator. If an error was found during + // the iteration, then the validity is changed to None to mark the value + // as Null + let validity = combine_validities(validity.as_ref(), Some(&bitmap)); + + PrimitiveArray::::new(data_type, values, validity) +} diff --git a/crates/nano-arrow/src/compute/arity_assign.rs b/crates/nano-arrow/src/compute/arity_assign.rs new file mode 100644 index 000000000000..e1b358d8aebb --- /dev/null +++ b/crates/nano-arrow/src/compute/arity_assign.rs @@ -0,0 +1,96 @@ +//! Defines generics suitable to perform operations to [`PrimitiveArray`] in-place. + +use either::Either; + +use super::utils::check_same_len; +use crate::array::PrimitiveArray; +use crate::types::NativeType; + +/// Applies an unary function to a [`PrimitiveArray`], optionally in-place. +/// +/// # Implementation +/// This function tries to apply the function directly to the values of the array. +/// If that region is shared, this function creates a new region and writes to it. +/// +/// # Panics +/// This function panics iff +/// * the arrays have a different length. +/// * the function itself panics. +#[inline] +pub fn unary(array: &mut PrimitiveArray, op: F) +where + I: NativeType, + F: Fn(I) -> I, +{ + if let Some(values) = array.get_mut_values() { + // mutate in place + values.iter_mut().for_each(|l| *l = op(*l)); + } else { + // alloc and write to new region + let values = array.values().iter().map(|l| op(*l)).collect::>(); + array.set_values(values.into()); + } +} + +/// Applies a binary function to two [`PrimitiveArray`]s, optionally in-place, returning +/// a new [`PrimitiveArray`]. +/// +/// # Implementation +/// This function tries to apply the function directly to the values of the array. +/// If that region is shared, this function creates a new region and writes to it. 
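To make the copy-on-write behaviour described above concrete, a minimal usage sketch (illustrative only, not part of the patch; it follows the `arrow2::` paths used by the doc examples elsewhere in this patch, and the exact crate and feature names are assumptions):

```rust
use arrow2::array::PrimitiveArray;
use arrow2::compute::arity_assign::binary;

fn main() {
    // `lhs` owns its buffers, so the closure is applied to its values in place;
    // if the buffers were shared, a freshly allocated region would be written instead.
    let mut lhs = PrimitiveArray::from_slice([1i32, 2, 3]);
    let rhs = PrimitiveArray::from_slice([10i32, 20, 30]);
    binary(&mut lhs, &rhs, |l, r| l + r);
    assert_eq!(lhs, PrimitiveArray::from_slice([11i32, 22, 33]));
}
```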
+/// # Panics +/// This function panics iff +/// * the arrays have a different length. +/// * the function itself panics. +#[inline] +pub fn binary(lhs: &mut PrimitiveArray, rhs: &PrimitiveArray, op: F) +where + T: NativeType, + D: NativeType, + F: Fn(T, D) -> T, +{ + check_same_len(lhs, rhs).unwrap(); + + // both for the validity and for the values + // we branch to check if we can mutate in place + // if we can, great that is fastest. + // if we cannot, we allocate a new buffer and assign values to that + // new buffer, that is benchmarked to be ~2x faster than first memcpy and assign in place + // for the validity bits it can be much faster as we might need to iterate all bits if the + // bitmap has an offset. + if let Some(rhs) = rhs.validity() { + if lhs.validity().is_none() { + lhs.set_validity(Some(rhs.clone())); + } else { + lhs.apply_validity(|bitmap| { + match bitmap.into_mut() { + Either::Left(immutable) => { + // alloc new region + &immutable & rhs + }, + Either::Right(mutable) => { + // mutate in place + (mutable & rhs).into() + }, + } + }); + } + }; + + if let Some(values) = lhs.get_mut_values() { + // mutate values in place + values + .iter_mut() + .zip(rhs.values().iter()) + .for_each(|(l, r)| *l = op(*l, *r)); + } else { + // alloc new region + let values = lhs + .values() + .iter() + .zip(rhs.values().iter()) + .map(|(l, r)| op(*l, *r)) + .collect::>(); + lhs.set_values(values.into()); + } +} diff --git a/crates/nano-arrow/src/compute/bitwise.rs b/crates/nano-arrow/src/compute/bitwise.rs new file mode 100644 index 000000000000..37c26542b848 --- /dev/null +++ b/crates/nano-arrow/src/compute/bitwise.rs @@ -0,0 +1,75 @@ +//! Contains bitwise operators: [`or`], [`and`], [`xor`] and [`not`]. +use std::ops::{BitAnd, BitOr, BitXor, Not}; + +use crate::array::PrimitiveArray; +use crate::compute::arity::{binary, unary}; +use crate::types::NativeType; + +/// Performs `OR` operation on two [`PrimitiveArray`]s. +/// # Panic +/// This function errors when the arrays have different lengths. +pub fn or(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + BitOr, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a | b) +} + +/// Performs `XOR` operation between two [`PrimitiveArray`]s. +/// # Panic +/// This function errors when the arrays have different lengths. +pub fn xor(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + BitXor, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a ^ b) +} + +/// Performs `AND` operation on two [`PrimitiveArray`]s. +/// # Panic +/// This function panics when the arrays have different lengths. +pub fn and(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + BitAnd, +{ + binary(lhs, rhs, lhs.data_type().clone(), |a, b| a & b) +} + +/// Returns a new [`PrimitiveArray`] with the bitwise `not`. +pub fn not(array: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + Not, +{ + let op = move |a: T| !a; + unary(array, op, array.data_type().clone()) +} + +/// Performs `OR` operation between a [`PrimitiveArray`] and scalar. +/// # Panic +/// This function errors when the arrays have different lengths. +pub fn or_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeType + BitOr, +{ + unary(lhs, |a| a | *rhs, lhs.data_type().clone()) +} + +/// Performs `XOR` operation between a [`PrimitiveArray`] and scalar. +/// # Panic +/// This function errors when the arrays have different lengths. 
+pub fn xor_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeType + BitXor, +{ + unary(lhs, |a| a ^ *rhs, lhs.data_type().clone()) +} + +/// Performs `AND` operation between a [`PrimitiveArray`] and scalar. +/// # Panic +/// This function panics when the arrays have different lengths. +pub fn and_scalar(lhs: &PrimitiveArray, rhs: &T) -> PrimitiveArray +where + T: NativeType + BitAnd, +{ + unary(lhs, |a| a & *rhs, lhs.data_type().clone()) +} diff --git a/crates/nano-arrow/src/compute/boolean.rs b/crates/nano-arrow/src/compute/boolean.rs new file mode 100644 index 000000000000..daf6853c3c29 --- /dev/null +++ b/crates/nano-arrow/src/compute/boolean.rs @@ -0,0 +1,288 @@ +//! null-preserving operators such as [`and`], [`or`] and [`not`]. +use super::utils::combine_validities; +use crate::array::{Array, BooleanArray}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::scalar::BooleanScalar; + +fn assert_lengths(lhs: &BooleanArray, rhs: &BooleanArray) { + assert_eq!( + lhs.len(), + rhs.len(), + "lhs and rhs must have the same length" + ); +} + +/// Helper function to implement binary kernels +pub(crate) fn binary_boolean_kernel( + lhs: &BooleanArray, + rhs: &BooleanArray, + op: F, +) -> BooleanArray +where + F: Fn(&Bitmap, &Bitmap) -> Bitmap, +{ + assert_lengths(lhs, rhs); + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let left_buffer = lhs.values(); + let right_buffer = rhs.values(); + + let values = op(left_buffer, right_buffer); + + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Performs `&&` operation on two [`BooleanArray`], combining the validities. +/// # Panics +/// This function panics iff the arrays have different lengths. +/// # Examples +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::and; +/// +/// let a = BooleanArray::from(&[Some(false), Some(true), None]); +/// let b = BooleanArray::from(&[Some(true), Some(true), Some(false)]); +/// let and_ab = and(&a, &b); +/// assert_eq!(and_ab, BooleanArray::from(&[Some(false), Some(true), None])); +/// ``` +pub fn and(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + if lhs.null_count() == 0 && rhs.null_count() == 0 { + let left_buffer = lhs.values(); + let right_buffer = rhs.values(); + + match (left_buffer.unset_bits(), right_buffer.unset_bits()) { + // all values are `true` on both sides + (0, 0) => { + assert_lengths(lhs, rhs); + return lhs.clone(); + }, + // all values are `false` on left side + (l, _) if l == lhs.len() => { + assert_lengths(lhs, rhs); + return lhs.clone(); + }, + // all values are `false` on right side + (_, r) if r == rhs.len() => { + assert_lengths(lhs, rhs); + return rhs.clone(); + }, + // ignore the rest + _ => {}, + } + } + + binary_boolean_kernel(lhs, rhs, |lhs, rhs| lhs & rhs) +} + +/// Performs `||` operation on two [`BooleanArray`], combining the validities. +/// # Panics +/// This function panics iff the arrays have different lengths. 
+/// # Examples +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::or; +/// +/// let a = BooleanArray::from(vec![Some(false), Some(true), None]); +/// let b = BooleanArray::from(vec![Some(true), Some(true), Some(false)]); +/// let or_ab = or(&a, &b); +/// assert_eq!(or_ab, BooleanArray::from(vec![Some(true), Some(true), None])); +/// ``` +pub fn or(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + if lhs.null_count() == 0 && rhs.null_count() == 0 { + let left_buffer = lhs.values(); + let right_buffer = rhs.values(); + + match (left_buffer.unset_bits(), right_buffer.unset_bits()) { + // all values are `true` on left side + (0, _) => { + assert_lengths(lhs, rhs); + return lhs.clone(); + }, + // all values are `true` on right side + (_, 0) => { + assert_lengths(lhs, rhs); + return rhs.clone(); + }, + // all values on lhs and rhs are `false` + (l, r) if l == lhs.len() && r == rhs.len() => { + assert_lengths(lhs, rhs); + return rhs.clone(); + }, + // ignore the rest + _ => {}, + } + } + + binary_boolean_kernel(lhs, rhs, |lhs, rhs| lhs | rhs) +} + +/// Performs unary `NOT` operation on an arrays. If value is null then the result is also +/// null. +/// # Example +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::not; +/// +/// let a = BooleanArray::from(vec![Some(false), Some(true), None]); +/// let not_a = not(&a); +/// assert_eq!(not_a, BooleanArray::from(vec![Some(true), Some(false), None])); +/// ``` +pub fn not(array: &BooleanArray) -> BooleanArray { + let values = !array.values(); + let validity = array.validity().cloned(); + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Returns a non-null [`BooleanArray`] with whether each value of the array is null. +/// # Example +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::is_null; +/// # fn main() { +/// let a = BooleanArray::from(vec![Some(false), Some(true), None]); +/// let a_is_null = is_null(&a); +/// assert_eq!(a_is_null, BooleanArray::from_slice(vec![false, false, true])); +/// # } +/// ``` +pub fn is_null(input: &dyn Array) -> BooleanArray { + let len = input.len(); + + let values = match input.validity() { + None => MutableBitmap::from_len_zeroed(len).into(), + Some(buffer) => !buffer, + }; + + BooleanArray::new(DataType::Boolean, values, None) +} + +/// Returns a non-null [`BooleanArray`] with whether each value of the array is not null. +/// # Example +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::is_not_null; +/// +/// let a = BooleanArray::from(&vec![Some(false), Some(true), None]); +/// let a_is_not_null = is_not_null(&a); +/// assert_eq!(a_is_not_null, BooleanArray::from_slice(&vec![true, true, false])); +/// ``` +pub fn is_not_null(input: &dyn Array) -> BooleanArray { + let values = match input.validity() { + None => { + let mut mutable = MutableBitmap::new(); + mutable.extend_constant(input.len(), true); + mutable.into() + }, + Some(buffer) => buffer.clone(), + }; + BooleanArray::new(DataType::Boolean, values, None) +} + +/// Performs `AND` operation on an array and a scalar value. If either left or right value +/// is null then the result is also null. 
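To complement the doc-test that follows (which only exercises a `Some(true)` scalar), here is a sketch of the null-scalar case described in the sentence above; all names are taken from this diff, and the `nano_arrow` paths are an assumption.

```rust
use nano_arrow::array::BooleanArray;
use nano_arrow::compute::boolean::and_scalar;
use nano_arrow::scalar::BooleanScalar;

fn and_with_null_scalar() {
    let array = BooleanArray::from_slice(&[true, false]);

    // A null scalar nullifies every slot, because `x AND null` is null in this kernel.
    let result = and_scalar(&array, &BooleanScalar::new(None));
    assert_eq!(result.null_count(), 2);
}
```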
+/// # Example +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::and_scalar; +/// use arrow2::scalar::BooleanScalar; +/// +/// let array = BooleanArray::from_slice(&[false, false, true, true]); +/// let scalar = BooleanScalar::new(Some(true)); +/// let result = and_scalar(&array, &scalar); +/// assert_eq!(result, BooleanArray::from_slice(&[false, false, true, true])); +/// +/// ``` +pub fn and_scalar(array: &BooleanArray, scalar: &BooleanScalar) -> BooleanArray { + match scalar.value() { + Some(true) => array.clone(), + Some(false) => { + let values = Bitmap::new_zeroed(array.len()); + BooleanArray::new(DataType::Boolean, values, array.validity().cloned()) + }, + None => BooleanArray::new_null(DataType::Boolean, array.len()), + } +} + +/// Performs `OR` operation on an array and a scalar value. If either left or right value +/// is null then the result is also null. +/// # Example +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::or_scalar; +/// use arrow2::scalar::BooleanScalar; +/// # fn main() { +/// let array = BooleanArray::from_slice(&[false, false, true, true]); +/// let scalar = BooleanScalar::new(Some(true)); +/// let result = or_scalar(&array, &scalar); +/// assert_eq!(result, BooleanArray::from_slice(&[true, true, true, true])); +/// # } +/// ``` +pub fn or_scalar(array: &BooleanArray, scalar: &BooleanScalar) -> BooleanArray { + match scalar.value() { + Some(true) => { + let mut values = MutableBitmap::new(); + values.extend_constant(array.len(), true); + BooleanArray::new(DataType::Boolean, values.into(), array.validity().cloned()) + }, + Some(false) => array.clone(), + None => BooleanArray::new_null(DataType::Boolean, array.len()), + } +} + +/// Returns whether any of the values in the array are `true`. +/// +/// Null values are ignored. +/// +/// # Example +/// +/// ``` +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::any; +/// +/// let a = BooleanArray::from(&[Some(true), Some(false)]); +/// let b = BooleanArray::from(&[Some(false), Some(false)]); +/// let c = BooleanArray::from(&[None, Some(false)]); +/// +/// assert_eq!(any(&a), true); +/// assert_eq!(any(&b), false); +/// assert_eq!(any(&c), false); +/// ``` +pub fn any(array: &BooleanArray) -> bool { + if array.is_empty() { + false + } else if array.null_count() > 0 { + array.into_iter().any(|v| v == Some(true)) + } else { + let vals = array.values(); + vals.unset_bits() != vals.len() + } +} + +/// Returns whether all values in the array are `true`. +/// +/// Null values are ignored. +/// +/// # Example +/// +/// ``` +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean::all; +/// +/// let a = BooleanArray::from(&[Some(true), Some(true)]); +/// let b = BooleanArray::from(&[Some(false), Some(true)]); +/// let c = BooleanArray::from(&[None, Some(true)]); +/// +/// assert_eq!(all(&a), true); +/// assert_eq!(all(&b), false); +/// assert_eq!(all(&c), true); +/// ``` +pub fn all(array: &BooleanArray) -> bool { + if array.is_empty() { + true + } else if array.null_count() > 0 { + !array.into_iter().any(|v| v == Some(false)) + } else { + let vals = array.values(); + vals.unset_bits() == 0 + } +} diff --git a/crates/nano-arrow/src/compute/boolean_kleene.rs b/crates/nano-arrow/src/compute/boolean_kleene.rs new file mode 100644 index 000000000000..2983c2e31ded --- /dev/null +++ b/crates/nano-arrow/src/compute/boolean_kleene.rs @@ -0,0 +1,301 @@ +//! 
Boolean operators of [Kleene logic](https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics). +use crate::array::{Array, BooleanArray}; +use crate::bitmap::{binary, quaternary, ternary, unary, Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::scalar::BooleanScalar; + +/// Logical 'or' operation on two arrays with [Kleene logic](https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics) +/// # Panics +/// This function panics iff the arrays have a different length +/// # Example +/// +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean_kleene::or; +/// +/// let a = BooleanArray::from(&[Some(true), Some(false), None]); +/// let b = BooleanArray::from(&[None, None, None]); +/// let or_ab = or(&a, &b); +/// assert_eq!(or_ab, BooleanArray::from(&[Some(true), None, None])); +/// ``` +pub fn or(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + assert_eq!( + lhs.len(), + rhs.len(), + "lhs and rhs must have the same length" + ); + + let lhs_values = lhs.values(); + let rhs_values = rhs.values(); + + let lhs_validity = lhs.validity(); + let rhs_validity = rhs.validity(); + + let validity = match (lhs_validity, rhs_validity) { + (Some(lhs_validity), Some(rhs_validity)) => { + Some(quaternary( + lhs_values, + rhs_values, + lhs_validity, + rhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, lhs_v, rhs_v| { + // A = T + (lhs & lhs_v) | + // B = T + (rhs & rhs_v) | + // A = F & B = F + (!lhs & lhs_v) & (!rhs & rhs_v) + }, + )) + }, + (Some(lhs_validity), None) => { + // B != U + Some(ternary( + lhs_values, + rhs_values, + lhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, lhs_v| { + // A = T + (lhs & lhs_v) | + // B = T + rhs | + // A = F & B = F + (!lhs & lhs_v) & !rhs + }, + )) + }, + (None, Some(rhs_validity)) => { + Some(ternary( + lhs_values, + rhs_values, + rhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, rhs_v| { + // A = T + lhs | + // B = T + (rhs & rhs_v) | + // A = F & B = F + !lhs & (!rhs & rhs_v) + }, + )) + }, + (None, None) => None, + }; + BooleanArray::new(DataType::Boolean, lhs_values | rhs_values, validity) +} + +/// Logical 'and' operation on two arrays with [Kleene logic](https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics) +/// # Panics +/// This function panics iff the arrays have a different length +/// # Example +/// +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean_kleene::and; +/// +/// let a = BooleanArray::from(&[Some(true), Some(false), None]); +/// let b = BooleanArray::from(&[None, None, None]); +/// let and_ab = and(&a, &b); +/// assert_eq!(and_ab, BooleanArray::from(&[None, Some(false), None])); +/// ``` +pub fn and(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + assert_eq!( + lhs.len(), + rhs.len(), + "lhs and rhs must have the same length" + ); + + let lhs_values = lhs.values(); + let rhs_values = rhs.values(); + + let lhs_validity = lhs.validity(); + let rhs_validity = rhs.validity(); + + let validity = match (lhs_validity, rhs_validity) { + (Some(lhs_validity), Some(rhs_validity)) => { + Some(quaternary( + lhs_values, + rhs_values, + lhs_validity, + rhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, lhs_v, rhs_v| { + // B = F + (!rhs & rhs_v) | + // A = F + (!lhs & lhs_v) | 
+ // A = T & B = T + (lhs & lhs_v) & (rhs & rhs_v) + }, + )) + }, + (Some(lhs_validity), None) => { + Some(ternary( + lhs_values, + rhs_values, + lhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, lhs_v| { + // B = F + !rhs | + // A = F + (!lhs & lhs_v) | + // A = T & B = T + (lhs & lhs_v) & rhs + }, + )) + }, + (None, Some(rhs_validity)) => { + Some(ternary( + lhs_values, + rhs_values, + rhs_validity, + // see https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics + |lhs, rhs, rhs_v| { + // B = F + (!rhs & rhs_v) | + // A = F + !lhs | + // A = T & B = T + lhs & (rhs & rhs_v) + }, + )) + }, + (None, None) => None, + }; + BooleanArray::new(DataType::Boolean, lhs_values & rhs_values, validity) +} + +/// Logical 'or' operation on an array and a scalar value with [Kleene logic](https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics) +/// # Example +/// +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::scalar::BooleanScalar; +/// use arrow2::compute::boolean_kleene::or_scalar; +/// +/// let array = BooleanArray::from(&[Some(true), Some(false), None]); +/// let scalar = BooleanScalar::new(Some(false)); +/// let result = or_scalar(&array, &scalar); +/// assert_eq!(result, BooleanArray::from(&[Some(true), Some(false), None])); +/// ``` +pub fn or_scalar(array: &BooleanArray, scalar: &BooleanScalar) -> BooleanArray { + match scalar.value() { + Some(true) => { + let mut values = MutableBitmap::new(); + values.extend_constant(array.len(), true); + BooleanArray::new(DataType::Boolean, values.into(), None) + }, + Some(false) => array.clone(), + None => { + let values = array.values(); + let validity = match array.validity() { + Some(validity) => binary(values, validity, |value, validity| validity & value), + None => unary(values, |value| value), + }; + BooleanArray::new(DataType::Boolean, values.clone(), Some(validity)) + }, + } +} + +/// Logical 'and' operation on an array and a scalar value with [Kleene logic](https://en.wikipedia.org/wiki/Three-valued_logic#Kleene_and_Priest_logics) +/// # Example +/// +/// ```rust +/// use arrow2::array::BooleanArray; +/// use arrow2::scalar::BooleanScalar; +/// use arrow2::compute::boolean_kleene::and_scalar; +/// +/// let array = BooleanArray::from(&[Some(true), Some(false), None]); +/// let scalar = BooleanScalar::new(None); +/// let result = and_scalar(&array, &scalar); +/// assert_eq!(result, BooleanArray::from(&[None, Some(false), None])); +/// ``` +pub fn and_scalar(array: &BooleanArray, scalar: &BooleanScalar) -> BooleanArray { + match scalar.value() { + Some(true) => array.clone(), + Some(false) => { + let values = Bitmap::new_zeroed(array.len()); + BooleanArray::new(DataType::Boolean, values, None) + }, + None => { + let values = array.values(); + let validity = match array.validity() { + Some(validity) => binary(values, validity, |value, validity| validity & !value), + None => unary(values, |value| !value), + }; + BooleanArray::new(DataType::Boolean, array.values().clone(), Some(validity)) + }, + } +} + +/// Returns whether any of the values in the array are `true`. +/// +/// The output is unknown (`None`) if the array contains any null values and +/// no `true` values. 
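Before the `any`/`all` reducers below, a short comparison sketch of this module against the null-preserving `compute::boolean` kernels; it assumes both modules are exported under a `nano_arrow` crate as laid out in this diff.

```rust
use nano_arrow::array::BooleanArray;
use nano_arrow::compute::{boolean, boolean_kleene};

fn kleene_vs_null_preserving() {
    let lhs = BooleanArray::from(&[Some(true), Some(false), None]);
    let rhs = BooleanArray::from(&[None, None, None]);

    // Null-preserving `or`: a null on either side always yields null.
    assert_eq!(boolean::or(&lhs, &rhs), BooleanArray::from(&[None, None, None]));

    // Kleene `or`: `true OR unknown` is `true`; only the remaining slots stay unknown.
    assert_eq!(
        boolean_kleene::or(&lhs, &rhs),
        BooleanArray::from(&[Some(true), None, None])
    );
}
```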
+/// +/// # Example +/// +/// ``` +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean_kleene::any; +/// +/// let a = BooleanArray::from(&[Some(true), Some(false)]); +/// let b = BooleanArray::from(&[Some(false), Some(false)]); +/// let c = BooleanArray::from(&[None, Some(false)]); +/// +/// assert_eq!(any(&a), Some(true)); +/// assert_eq!(any(&b), Some(false)); +/// assert_eq!(any(&c), None); +/// ``` +pub fn any(array: &BooleanArray) -> Option { + if array.is_empty() { + Some(false) + } else if array.null_count() > 0 { + if array.into_iter().any(|v| v == Some(true)) { + Some(true) + } else { + None + } + } else { + let vals = array.values(); + Some(vals.unset_bits() != vals.len()) + } +} + +/// Returns whether all values in the array are `true`. +/// +/// The output is unknown (`None`) if the array contains any null values and +/// no `false` values. +/// +/// # Example +/// +/// ``` +/// use arrow2::array::BooleanArray; +/// use arrow2::compute::boolean_kleene::all; +/// +/// let a = BooleanArray::from(&[Some(true), Some(true)]); +/// let b = BooleanArray::from(&[Some(false), Some(true)]); +/// let c = BooleanArray::from(&[None, Some(true)]); +/// +/// assert_eq!(all(&a), Some(true)); +/// assert_eq!(all(&b), Some(false)); +/// assert_eq!(all(&c), None); +/// ``` +pub fn all(array: &BooleanArray) -> Option { + if array.is_empty() { + Some(true) + } else if array.null_count() > 0 { + if array.into_iter().any(|v| v == Some(false)) { + Some(false) + } else { + None + } + } else { + let vals = array.values(); + Some(vals.unset_bits() == 0) + } +} diff --git a/crates/nano-arrow/src/compute/cast/binary_to.rs b/crates/nano-arrow/src/compute/cast/binary_to.rs new file mode 100644 index 000000000000..52038f9caefa --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/binary_to.rs @@ -0,0 +1,159 @@ +use super::CastOptions; +use crate::array::*; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::offset::{Offset, Offsets}; +use crate::types::NativeType; + +/// Conversion of binary +pub fn binary_to_large_binary(from: &BinaryArray, to_data_type: DataType) -> BinaryArray { + let values = from.values().clone(); + BinaryArray::::new( + to_data_type, + from.offsets().into(), + values, + from.validity().cloned(), + ) +} + +/// Conversion of binary +pub fn binary_large_to_binary( + from: &BinaryArray, + to_data_type: DataType, +) -> Result> { + let values = from.values().clone(); + let offsets = from.offsets().try_into()?; + Ok(BinaryArray::::new( + to_data_type, + offsets, + values, + from.validity().cloned(), + )) +} + +/// Conversion to utf8 +pub fn binary_to_utf8( + from: &BinaryArray, + to_data_type: DataType, +) -> Result> { + Utf8Array::::try_new( + to_data_type, + from.offsets().clone(), + from.values().clone(), + from.validity().cloned(), + ) +} + +/// Conversion to utf8 +/// # Errors +/// This function errors if the values are not valid utf8 +pub fn binary_to_large_utf8( + from: &BinaryArray, + to_data_type: DataType, +) -> Result> { + let values = from.values().clone(); + let offsets = from.offsets().into(); + + Utf8Array::::try_new(to_data_type, offsets, values, from.validity().cloned()) +} + +/// Casts a [`BinaryArray`] to a [`PrimitiveArray`] at best-effort using `lexical_core::parse_partial`, making any uncastable value as zero. 
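A sketch contrasting the strict parser with the best-effort parser whose definition follows; it assumes `BinaryArray`'s `FromIterator` over optional byte slices from arrow2 is kept, and that `u32` is an arbitrary target type.

```rust
use nano_arrow::array::BinaryArray;
use nano_arrow::compute::cast::{binary_to_primitive, partial_binary_to_primitive};
use nano_arrow::datatypes::DataType;

fn strict_vs_partial_parse() {
    let array: BinaryArray<i32> = [Some(&b"123"[..]), Some(&b"12abc"[..]), None]
        .into_iter()
        .collect();

    // Strict parsing: trailing garbage makes the slot null.
    let strict = binary_to_primitive::<i32, u32>(&array, &DataType::UInt32);
    assert_eq!(strict.iter().collect::<Vec<_>>(), vec![Some(&123), None, None]);

    // Best-effort parsing: the longest numeric prefix is kept instead.
    let partial = partial_binary_to_primitive::<i32, u32>(&array, &DataType::UInt32);
    assert_eq!(partial.iter().collect::<Vec<_>>(), vec![Some(&123), Some(&12), None]);
}
```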
+pub fn partial_binary_to_primitive( + from: &BinaryArray, + to: &DataType, +) -> PrimitiveArray +where + T: NativeType + lexical_core::FromLexical, +{ + let iter = from + .iter() + .map(|x| x.and_then::(|x| lexical_core::parse_partial(x).ok().map(|x| x.0))); + + PrimitiveArray::::from_trusted_len_iter(iter).to(to.clone()) +} + +/// Casts a [`BinaryArray`] to a [`PrimitiveArray`], making any uncastable value a Null. +pub fn binary_to_primitive(from: &BinaryArray, to: &DataType) -> PrimitiveArray +where + T: NativeType + lexical_core::FromLexical, +{ + let iter = from + .iter() + .map(|x| x.and_then::(|x| lexical_core::parse(x).ok())); + + PrimitiveArray::::from_trusted_len_iter(iter).to(to.clone()) +} + +pub(super) fn binary_to_primitive_dyn( + from: &dyn Array, + to: &DataType, + options: CastOptions, +) -> Result> +where + T: NativeType + lexical_core::FromLexical, +{ + let from = from.as_any().downcast_ref().unwrap(); + if options.partial { + Ok(Box::new(partial_binary_to_primitive::(from, to))) + } else { + Ok(Box::new(binary_to_primitive::(from, to))) + } +} + +/// Cast [`BinaryArray`] to [`DictionaryArray`], also known as packing. +/// # Errors +/// This function errors if the maximum key is smaller than the number of distinct elements +/// in the array. +pub fn binary_to_dictionary( + from: &BinaryArray, +) -> Result> { + let mut array = MutableDictionaryArray::>::new(); + array.try_extend(from.iter())?; + + Ok(array.into()) +} + +pub(super) fn binary_to_dictionary_dyn( + from: &dyn Array, +) -> Result> { + let values = from.as_any().downcast_ref().unwrap(); + binary_to_dictionary::(values).map(|x| Box::new(x) as Box) +} + +fn fixed_size_to_offsets(values_len: usize, fixed_size: usize) -> Offsets { + let offsets = (0..(values_len + 1)) + .step_by(fixed_size) + .map(|v| O::from_usize(v).unwrap()) + .collect(); + // Safety + // * every element is `>= 0` + // * element at position `i` is >= than element at position `i-1`. + unsafe { Offsets::new_unchecked(offsets) } +} + +/// Conversion of `FixedSizeBinary` to `Binary`. +pub fn fixed_size_binary_binary( + from: &FixedSizeBinaryArray, + to_data_type: DataType, +) -> BinaryArray { + let values = from.values().clone(); + let offsets = fixed_size_to_offsets(values.len(), from.size()); + BinaryArray::::new( + to_data_type, + offsets.into(), + values, + from.validity().cloned(), + ) +} + +/// Conversion of binary +pub fn binary_to_list(from: &BinaryArray, to_data_type: DataType) -> ListArray { + let values = from.values().clone(); + let values = PrimitiveArray::new(DataType::UInt8, values, None); + ListArray::::new( + to_data_type, + from.offsets().clone(), + values.boxed(), + from.validity().cloned(), + ) +} diff --git a/crates/nano-arrow/src/compute/cast/boolean_to.rs b/crates/nano-arrow/src/compute/cast/boolean_to.rs new file mode 100644 index 000000000000..8a8cf7089d8f --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/boolean_to.rs @@ -0,0 +1,48 @@ +use crate::array::{Array, BinaryArray, BooleanArray, PrimitiveArray, Utf8Array}; +use crate::error::Result; +use crate::offset::Offset; +use crate::types::NativeType; + +pub(super) fn boolean_to_primitive_dyn(array: &dyn Array) -> Result> +where + T: NativeType + num_traits::One, +{ + let array = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(boolean_to_primitive::(array))) +} + +/// Casts the [`BooleanArray`] to a [`PrimitiveArray`]. 
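For reference, a quick sketch of the casts in this file; the `u32`/`i32` target parameters and the `nano_arrow` paths are assumptions of the sketch.

```rust
use nano_arrow::array::BooleanArray;
use nano_arrow::compute::cast::{boolean_to_primitive, boolean_to_utf8};

fn boolean_cast_demo() {
    let array = BooleanArray::from(&[Some(true), Some(false), None]);

    // `true` maps to `T::one()`, `false` to `T::default()`; the validity is carried over.
    let ints = boolean_to_primitive::<u32>(&array);
    assert_eq!(ints.iter().collect::<Vec<_>>(), vec![Some(&1), Some(&0), None]);

    // The utf8 cast writes "1"/"0" from the values buffer and drops the validity.
    let strings = boolean_to_utf8::<i32>(&array);
    assert_eq!(strings.value(0), "1");
    assert_eq!(strings.value(1), "0");
}
```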
+pub fn boolean_to_primitive(from: &BooleanArray) -> PrimitiveArray +where + T: NativeType + num_traits::One, +{ + let values = from + .values() + .iter() + .map(|x| if x { T::one() } else { T::default() }) + .collect::>(); + + PrimitiveArray::::new(T::PRIMITIVE.into(), values.into(), from.validity().cloned()) +} + +/// Casts the [`BooleanArray`] to a [`Utf8Array`], casting trues to `"1"` and falses to `"0"` +pub fn boolean_to_utf8(from: &BooleanArray) -> Utf8Array { + let iter = from.values().iter().map(|x| if x { "1" } else { "0" }); + Utf8Array::from_trusted_len_values_iter(iter) +} + +pub(super) fn boolean_to_utf8_dyn(array: &dyn Array) -> Result> { + let array = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(boolean_to_utf8::(array))) +} + +/// Casts the [`BooleanArray`] to a [`BinaryArray`], casting trues to `"1"` and falses to `"0"` +pub fn boolean_to_binary(from: &BooleanArray) -> BinaryArray { + let iter = from.values().iter().map(|x| if x { b"1" } else { b"0" }); + BinaryArray::from_trusted_len_values_iter(iter) +} + +pub(super) fn boolean_to_binary_dyn(array: &dyn Array) -> Result> { + let array = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(boolean_to_binary::(array))) +} diff --git a/crates/nano-arrow/src/compute/cast/decimal_to.rs b/crates/nano-arrow/src/compute/cast/decimal_to.rs new file mode 100644 index 000000000000..ba9995c86c12 --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/decimal_to.rs @@ -0,0 +1,137 @@ +use num_traits::{AsPrimitive, Float, NumCast}; + +use crate::array::*; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::NativeType; + +#[inline] +fn decimal_to_decimal_impl Option>( + from: &PrimitiveArray, + op: F, + to_precision: usize, + to_scale: usize, +) -> PrimitiveArray { + let min_for_precision = 9_i128 + .saturating_pow(1 + to_precision as u32) + .saturating_neg(); + let max_for_precision = 9_i128.saturating_pow(1 + to_precision as u32); + + let values = from.iter().map(|x| { + x.and_then(|x| { + op(*x).and_then(|x| { + if x > max_for_precision || x < min_for_precision { + None + } else { + Some(x) + } + }) + }) + }); + PrimitiveArray::::from_trusted_len_iter(values) + .to(DataType::Decimal(to_precision, to_scale)) +} + +/// Returns a [`PrimitiveArray`] with the casted values. 
Values are `None` on overflow +pub fn decimal_to_decimal( + from: &PrimitiveArray, + to_precision: usize, + to_scale: usize, +) -> PrimitiveArray { + let (from_precision, from_scale) = + if let DataType::Decimal(p, s) = from.data_type().to_logical_type() { + (*p, *s) + } else { + panic!("internal error: i128 is always a decimal") + }; + + if to_scale == from_scale && to_precision >= from_precision { + // fast path + return from.clone().to(DataType::Decimal(to_precision, to_scale)); + } + // todo: other fast paths include increasing scale and precision by so that + // a number will never overflow (validity is preserved) + + if from_scale > to_scale { + let factor = 10_i128.pow((from_scale - to_scale) as u32); + decimal_to_decimal_impl( + from, + |x: i128| x.checked_div(factor), + to_precision, + to_scale, + ) + } else { + let factor = 10_i128.pow((to_scale - from_scale) as u32); + decimal_to_decimal_impl( + from, + |x: i128| x.checked_mul(factor), + to_precision, + to_scale, + ) + } +} + +pub(super) fn decimal_to_decimal_dyn( + from: &dyn Array, + to_precision: usize, + to_scale: usize, +) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(decimal_to_decimal(from, to_precision, to_scale))) +} + +/// Returns a [`PrimitiveArray`] with the casted values. Values are `None` on overflow +pub fn decimal_to_float(from: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + Float, + f64: AsPrimitive, +{ + let (_, from_scale) = if let DataType::Decimal(p, s) = from.data_type().to_logical_type() { + (*p, *s) + } else { + panic!("internal error: i128 is always a decimal") + }; + + let div = 10_f64.powi(from_scale as i32); + let values = from + .values() + .iter() + .map(|x| (*x as f64 / div).as_()) + .collect(); + + PrimitiveArray::::new(T::PRIMITIVE.into(), values, from.validity().cloned()) +} + +pub(super) fn decimal_to_float_dyn(from: &dyn Array) -> Result> +where + T: NativeType + Float, + f64: AsPrimitive, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(decimal_to_float::(from))) +} + +/// Returns a [`PrimitiveArray`] with the casted values. Values are `None` on overflow +pub fn decimal_to_integer(from: &PrimitiveArray) -> PrimitiveArray +where + T: NativeType + NumCast, +{ + let (_, from_scale) = if let DataType::Decimal(p, s) = from.data_type().to_logical_type() { + (*p, *s) + } else { + panic!("internal error: i128 is always a decimal") + }; + + let factor = 10_i128.pow(from_scale as u32); + let values = from.iter().map(|x| x.and_then(|x| T::from(*x / factor))); + + PrimitiveArray::from_trusted_len_iter(values) +} + +pub(super) fn decimal_to_integer_dyn(from: &dyn Array) -> Result> +where + T: NativeType + NumCast, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(decimal_to_integer::(from))) +} diff --git a/crates/nano-arrow/src/compute/cast/dictionary_to.rs b/crates/nano-arrow/src/compute/cast/dictionary_to.rs new file mode 100644 index 000000000000..4126e4a3d589 --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/dictionary_to.rs @@ -0,0 +1,183 @@ +use super::{primitive_as_primitive, primitive_to_primitive, CastOptions}; +use crate::array::{Array, DictionaryArray, DictionaryKey, PrimitiveArray}; +use crate::compute::cast::cast; +use crate::compute::take::take; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +macro_rules! 
key_cast { + ($keys:expr, $values:expr, $array:expr, $to_keys_type:expr, $to_type:ty, $to_datatype:expr) => {{ + let cast_keys = primitive_to_primitive::<_, $to_type>($keys, $to_keys_type); + + // Failure to cast keys (because they don't fit in the + // target type) results in NULL values; + if cast_keys.null_count() > $keys.null_count() { + return Err(Error::Overflow); + } + // Safety: this is safe because given a type `T` that fits in a `usize`, casting it to type `P` either overflows or also fits in a `usize` + unsafe { + DictionaryArray::try_new_unchecked($to_datatype, cast_keys, $values.clone()) + } + .map(|x| x.boxed()) + }}; +} + +/// Casts a [`DictionaryArray`] to a new [`DictionaryArray`] by keeping the +/// keys and casting the values to `values_type`. +/// # Errors +/// This function errors if the values are not castable to `values_type` +pub fn dictionary_to_dictionary_values( + from: &DictionaryArray, + values_type: &DataType, +) -> Result> { + let keys = from.keys(); + let values = from.values(); + let length = values.len(); + + let values = cast(values.as_ref(), values_type, CastOptions::default())?; + + assert_eq!(values.len(), length); // this is guaranteed by `cast` + unsafe { + DictionaryArray::try_new_unchecked(from.data_type().clone(), keys.clone(), values.clone()) + } +} + +/// Similar to dictionary_to_dictionary_values, but overflowing cast is wrapped +pub fn wrapping_dictionary_to_dictionary_values( + from: &DictionaryArray, + values_type: &DataType, +) -> Result> { + let keys = from.keys(); + let values = from.values(); + let length = values.len(); + + let values = cast( + values.as_ref(), + values_type, + CastOptions { + wrapped: true, + partial: false, + }, + )?; + assert_eq!(values.len(), length); // this is guaranteed by `cast` + unsafe { + DictionaryArray::try_new_unchecked(from.data_type().clone(), keys.clone(), values.clone()) + } +} + +/// Casts a [`DictionaryArray`] to a new [`DictionaryArray`] backed by a +/// different physical type of the keys, while keeping the values equal. +/// # Errors +/// Errors if any of the old keys' values is larger than the maximum value +/// supported by the new physical type. 
+pub fn dictionary_to_dictionary_keys( + from: &DictionaryArray, +) -> Result> +where + K1: DictionaryKey + num_traits::NumCast, + K2: DictionaryKey + num_traits::NumCast, +{ + let keys = from.keys(); + let values = from.values(); + let is_ordered = from.is_ordered(); + + let casted_keys = primitive_to_primitive::(keys, &K2::PRIMITIVE.into()); + + if casted_keys.null_count() > keys.null_count() { + Err(Error::Overflow) + } else { + let data_type = DataType::Dictionary( + K2::KEY_TYPE, + Box::new(values.data_type().clone()), + is_ordered, + ); + // Safety: this is safe because given a type `T` that fits in a `usize`, casting it to type `P` either overflows or also fits in a `usize` + unsafe { DictionaryArray::try_new_unchecked(data_type, casted_keys, values.clone()) } + } +} + +/// Similar to dictionary_to_dictionary_keys, but overflowing cast is wrapped +pub fn wrapping_dictionary_to_dictionary_keys( + from: &DictionaryArray, +) -> Result> +where + K1: DictionaryKey + num_traits::AsPrimitive, + K2: DictionaryKey, +{ + let keys = from.keys(); + let values = from.values(); + let is_ordered = from.is_ordered(); + + let casted_keys = primitive_as_primitive::(keys, &K2::PRIMITIVE.into()); + + if casted_keys.null_count() > keys.null_count() { + Err(Error::Overflow) + } else { + let data_type = DataType::Dictionary( + K2::KEY_TYPE, + Box::new(values.data_type().clone()), + is_ordered, + ); + // some of the values may not fit in `usize` and thus this needs to be checked + DictionaryArray::try_new(data_type, casted_keys, values.clone()) + } +} + +pub(super) fn dictionary_cast_dyn( + array: &dyn Array, + to_type: &DataType, + options: CastOptions, +) -> Result> { + let array = array.as_any().downcast_ref::>().unwrap(); + let keys = array.keys(); + let values = array.values(); + + match to_type { + DataType::Dictionary(to_keys_type, to_values_type, _) => { + let values = cast(values.as_ref(), to_values_type, options)?; + + // create the appropriate array type + let to_key_type = (*to_keys_type).into(); + + // Safety: + // we return an error on overflow so the integers remain within bounds + match_integer_type!(to_keys_type, |$T| { + key_cast!(keys, values, array, &to_key_type, $T, to_type.clone()) + }) + }, + _ => unpack_dictionary::(keys, values.as_ref(), to_type, options), + } +} + +// Unpack the dictionary +fn unpack_dictionary( + keys: &PrimitiveArray, + values: &dyn Array, + to_type: &DataType, + options: CastOptions, +) -> Result> +where + K: DictionaryKey + num_traits::NumCast, +{ + // attempt to cast the dict values to the target type + // use the take kernel to expand out the dictionary + let values = cast(values, to_type, options)?; + + // take requires first casting i32 + let indices = primitive_to_primitive::<_, i32>(keys, &DataType::Int32); + + take(values.as_ref(), &indices) +} + +/// Casts a [`DictionaryArray`] to its values' [`DataType`], also known as unpacking. +/// The resulting array has the same length. +pub fn dictionary_to_values(from: &DictionaryArray) -> Box +where + K: DictionaryKey + num_traits::NumCast, +{ + // take requires first casting i64 + let indices = primitive_to_primitive::<_, i64>(from.keys(), &DataType::Int64); + + // unwrap: The dictionary guarantees that the keys are not out-of-bounds. 
+ take(from.values().as_ref(), &indices).unwrap() +} diff --git a/crates/nano-arrow/src/compute/cast/mod.rs b/crates/nano-arrow/src/compute/cast/mod.rs new file mode 100644 index 000000000000..f13a638a9c0d --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/mod.rs @@ -0,0 +1,989 @@ +//! Defines different casting operators such as [`cast`] or [`primitive_to_binary`]. + +mod binary_to; +mod boolean_to; +mod decimal_to; +mod dictionary_to; +mod primitive_to; +mod utf8_to; + +pub use binary_to::*; +pub use boolean_to::*; +pub use decimal_to::*; +pub use dictionary_to::*; +pub use primitive_to::*; +pub use utf8_to::*; + +use crate::array::*; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::offset::{Offset, Offsets}; + +/// options defining how Cast kernels behave +#[derive(Clone, Copy, Debug, Default)] +pub struct CastOptions { + /// default to false + /// whether an overflowing cast should be converted to `None` (default), or be wrapped (i.e. `256i16 as u8 = 0` vectorized). + /// Settings this to `true` is 5-6x faster for numeric types. + pub wrapped: bool, + /// default to false + /// whether to cast to an integer at the best-effort + pub partial: bool, +} + +impl CastOptions { + fn with_wrapped(&self, v: bool) -> Self { + let mut option = *self; + option.wrapped = v; + option + } +} + +/// Returns true if this type is numeric: (UInt*, Unit*, or Float*). +fn is_numeric(t: &DataType) -> bool { + use DataType::*; + matches!( + t, + UInt8 | UInt16 | UInt32 | UInt64 | Int8 | Int16 | Int32 | Int64 | Float32 | Float64 + ) +} + +macro_rules! primitive_dyn { + ($from:expr, $expr:tt) => {{ + let from = $from.as_any().downcast_ref().unwrap(); + Ok(Box::new($expr(from))) + }}; + ($from:expr, $expr:tt, $to:expr) => {{ + let from = $from.as_any().downcast_ref().unwrap(); + Ok(Box::new($expr(from, $to))) + }}; + ($from:expr, $expr:tt, $from_t:expr, $to:expr) => {{ + let from = $from.as_any().downcast_ref().unwrap(); + Ok(Box::new($expr(from, $from_t, $to))) + }}; + ($from:expr, $expr:tt, $arg1:expr, $arg2:expr, $arg3:expr) => {{ + let from = $from.as_any().downcast_ref().unwrap(); + Ok(Box::new($expr(from, $arg1, $arg2, $arg3))) + }}; +} + +/// Return true if a value of type `from_type` can be cast into a +/// value of `to_type`. Note that such as cast may be lossy. +/// +/// If this function returns true to stay consistent with the `cast` kernel below. 
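Finally, a sketch of how the two public entry points of this module fit together; the concrete types are arbitrary and the `nano_arrow` paths are assumed.

```rust
use nano_arrow::array::{Array, Int32Array, Utf8Array};
use nano_arrow::compute::cast::{can_cast_types, cast, CastOptions};
use nano_arrow::datatypes::DataType;

fn cast_entry_points() {
    let ints = Int32Array::from(&[Some(1), None, Some(3)]);

    // `can_cast_types` is the cheap pre-check that mirrors the big match in `cast` below.
    assert!(can_cast_types(ints.data_type(), &DataType::Utf8));

    // `cast` returns a boxed array; downcast to inspect the concrete result.
    let casted = cast(&ints, &DataType::Utf8, CastOptions::default()).unwrap();
    let strings = casted.as_any().downcast_ref::<Utf8Array<i32>>().unwrap();
    assert_eq!(strings.iter().collect::<Vec<_>>(), vec![Some("1"), None, Some("3")]);
}
```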
+pub fn can_cast_types(from_type: &DataType, to_type: &DataType) -> bool { + use self::DataType::*; + if from_type == to_type { + return true; + } + + match (from_type, to_type) { + (Null, _) | (_, Null) => true, + (Struct(_), _) => false, + (_, Struct(_)) => false, + (FixedSizeList(list_from, _), List(list_to)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (FixedSizeList(list_from, _), LargeList(list_to)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (List(list_from), FixedSizeList(list_to, _)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (LargeList(list_from), FixedSizeList(list_to, _)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (List(list_from), List(list_to)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (LargeList(list_from), LargeList(list_to)) => { + can_cast_types(&list_from.data_type, &list_to.data_type) + }, + (List(list_from), LargeList(list_to)) if list_from == list_to => true, + (LargeList(list_from), List(list_to)) if list_from == list_to => true, + (_, List(list_to)) => can_cast_types(from_type, &list_to.data_type), + (_, LargeList(list_to)) if from_type != &LargeBinary => { + can_cast_types(from_type, &list_to.data_type) + }, + (Dictionary(_, from_value_type, _), Dictionary(_, to_value_type, _)) => { + can_cast_types(from_value_type, to_value_type) + }, + (Dictionary(_, value_type, _), _) => can_cast_types(value_type, to_type), + (_, Dictionary(_, value_type, _)) => can_cast_types(from_type, value_type), + + (_, Boolean) => is_numeric(from_type), + (Boolean, _) => { + is_numeric(to_type) + || to_type == &Utf8 + || to_type == &LargeUtf8 + || to_type == &Binary + || to_type == &LargeBinary + }, + + (Utf8, to_type) => { + is_numeric(to_type) + || matches!( + to_type, + LargeUtf8 | Binary | Date32 | Date64 | Timestamp(TimeUnit::Nanosecond, _) + ) + }, + (LargeUtf8, to_type) => { + is_numeric(to_type) + || matches!( + to_type, + Utf8 | LargeBinary | Date32 | Date64 | Timestamp(TimeUnit::Nanosecond, _) + ) + }, + + (Binary, to_type) => { + is_numeric(to_type) || matches!(to_type, LargeBinary | Utf8 | LargeUtf8) + }, + (LargeBinary, to_type) => { + is_numeric(to_type) + || match to_type { + Binary | LargeUtf8 => true, + LargeList(field) => matches!(field.data_type, UInt8), + _ => false, + } + }, + (FixedSizeBinary(_), to_type) => matches!(to_type, Binary | LargeBinary), + (Timestamp(_, _), Utf8) => true, + (Timestamp(_, _), LargeUtf8) => true, + (_, Utf8) => is_numeric(from_type) || from_type == &Binary, + (_, LargeUtf8) => is_numeric(from_type) || from_type == &LargeBinary, + + (_, Binary) => is_numeric(from_type), + (_, LargeBinary) => is_numeric(from_type), + + // start numeric casts + (UInt8, UInt16) => true, + (UInt8, UInt32) => true, + (UInt8, UInt64) => true, + (UInt8, Int8) => true, + (UInt8, Int16) => true, + (UInt8, Int32) => true, + (UInt8, Int64) => true, + (UInt8, Float32) => true, + (UInt8, Float64) => true, + (UInt8, Decimal(_, _)) => true, + + (UInt16, UInt8) => true, + (UInt16, UInt32) => true, + (UInt16, UInt64) => true, + (UInt16, Int8) => true, + (UInt16, Int16) => true, + (UInt16, Int32) => true, + (UInt16, Int64) => true, + (UInt16, Float32) => true, + (UInt16, Float64) => true, + (UInt16, Decimal(_, _)) => true, + + (UInt32, UInt8) => true, + (UInt32, UInt16) => true, + (UInt32, UInt64) => true, + (UInt32, Int8) => true, + (UInt32, Int16) => true, + (UInt32, Int32) => true, + (UInt32, Int64) => true, + (UInt32, Float32) => true, + 
(UInt32, Float64) => true, + (UInt32, Decimal(_, _)) => true, + + (UInt64, UInt8) => true, + (UInt64, UInt16) => true, + (UInt64, UInt32) => true, + (UInt64, Int8) => true, + (UInt64, Int16) => true, + (UInt64, Int32) => true, + (UInt64, Int64) => true, + (UInt64, Float32) => true, + (UInt64, Float64) => true, + (UInt64, Decimal(_, _)) => true, + + (Int8, UInt8) => true, + (Int8, UInt16) => true, + (Int8, UInt32) => true, + (Int8, UInt64) => true, + (Int8, Int16) => true, + (Int8, Int32) => true, + (Int8, Int64) => true, + (Int8, Float32) => true, + (Int8, Float64) => true, + (Int8, Decimal(_, _)) => true, + + (Int16, UInt8) => true, + (Int16, UInt16) => true, + (Int16, UInt32) => true, + (Int16, UInt64) => true, + (Int16, Int8) => true, + (Int16, Int32) => true, + (Int16, Int64) => true, + (Int16, Float32) => true, + (Int16, Float64) => true, + (Int16, Decimal(_, _)) => true, + + (Int32, UInt8) => true, + (Int32, UInt16) => true, + (Int32, UInt32) => true, + (Int32, UInt64) => true, + (Int32, Int8) => true, + (Int32, Int16) => true, + (Int32, Int64) => true, + (Int32, Float32) => true, + (Int32, Float64) => true, + (Int32, Decimal(_, _)) => true, + + (Int64, UInt8) => true, + (Int64, UInt16) => true, + (Int64, UInt32) => true, + (Int64, UInt64) => true, + (Int64, Int8) => true, + (Int64, Int16) => true, + (Int64, Int32) => true, + (Int64, Float32) => true, + (Int64, Float64) => true, + (Int64, Decimal(_, _)) => true, + + (Float16, Float32) => true, + + (Float32, UInt8) => true, + (Float32, UInt16) => true, + (Float32, UInt32) => true, + (Float32, UInt64) => true, + (Float32, Int8) => true, + (Float32, Int16) => true, + (Float32, Int32) => true, + (Float32, Int64) => true, + (Float32, Float64) => true, + (Float32, Decimal(_, _)) => true, + + (Float64, UInt8) => true, + (Float64, UInt16) => true, + (Float64, UInt32) => true, + (Float64, UInt64) => true, + (Float64, Int8) => true, + (Float64, Int16) => true, + (Float64, Int32) => true, + (Float64, Int64) => true, + (Float64, Float32) => true, + (Float64, Decimal(_, _)) => true, + + ( + Decimal(_, _), + UInt8 + | UInt16 + | UInt32 + | UInt64 + | Int8 + | Int16 + | Int32 + | Int64 + | Float32 + | Float64 + | Decimal(_, _), + ) => true, + // end numeric casts + + // temporal casts + (Int32, Date32) => true, + (Int32, Time32(_)) => true, + (Date32, Int32) => true, + (Date32, Int64) => true, + (Time32(_), Int32) => true, + (Int64, Date64) => true, + (Int64, Time64(_)) => true, + (Date64, Int32) => true, + (Date64, Int64) => true, + (Time64(_), Int64) => true, + (Date32, Date64) => true, + (Date64, Date32) => true, + (Time32(TimeUnit::Second), Time32(TimeUnit::Millisecond)) => true, + (Time32(TimeUnit::Millisecond), Time32(TimeUnit::Second)) => true, + (Time32(_), Time64(_)) => true, + (Time64(TimeUnit::Microsecond), Time64(TimeUnit::Nanosecond)) => true, + (Time64(TimeUnit::Nanosecond), Time64(TimeUnit::Microsecond)) => true, + (Time64(_), Time32(to_unit)) => { + matches!(to_unit, TimeUnit::Second | TimeUnit::Millisecond) + }, + (Timestamp(_, _), Int64) => true, + (Int64, Timestamp(_, _)) => true, + (Timestamp(_, _), Timestamp(_, _)) => true, + (Timestamp(_, _), Date32) => true, + (Timestamp(_, _), Date64) => true, + (Int64, Duration(_)) => true, + (Duration(_), Int64) => true, + (Interval(_), Interval(IntervalUnit::MonthDayNano)) => true, + (_, _) => false, + } +} + +fn cast_list( + array: &ListArray, + to_type: &DataType, + options: CastOptions, +) -> Result> { + let values = array.values(); + let new_values = cast( + values.as_ref(), + 
ListArray::::get_child_type(to_type), + options, + )?; + + Ok(ListArray::::new( + to_type.clone(), + array.offsets().clone(), + new_values, + array.validity().cloned(), + )) +} + +fn cast_list_to_large_list(array: &ListArray, to_type: &DataType) -> ListArray { + let offsets = array.offsets().into(); + + ListArray::::new( + to_type.clone(), + offsets, + array.values().clone(), + array.validity().cloned(), + ) +} + +fn cast_large_to_list(array: &ListArray, to_type: &DataType) -> ListArray { + let offsets = array.offsets().try_into().expect("Convertme to error"); + + ListArray::::new( + to_type.clone(), + offsets, + array.values().clone(), + array.validity().cloned(), + ) +} + +fn cast_fixed_size_list_to_list( + fixed: &FixedSizeListArray, + to_type: &DataType, + options: CastOptions, +) -> Result> { + let new_values = cast( + fixed.values().as_ref(), + ListArray::::get_child_type(to_type), + options, + )?; + + let offsets = (0..=fixed.len()) + .map(|ix| O::from_as_usize(ix * fixed.size())) + .collect::>(); + // Safety: offsets _are_ monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }; + + Ok(ListArray::::new( + to_type.clone(), + offsets.into(), + new_values, + fixed.validity().cloned(), + )) +} + +fn cast_list_to_fixed_size_list( + list: &ListArray, + inner: &Field, + size: usize, + options: CastOptions, +) -> Result { + let offsets = list.offsets().buffer().iter(); + let expected = (0..list.len()).map(|ix| O::from_as_usize(ix * size)); + + match offsets + .zip(expected) + .find(|(actual, expected)| *actual != expected) + { + Some(_) => Err(Error::InvalidArgumentError( + "incompatible offsets in source list".to_string(), + )), + None => { + let sliced_values = list.values().sliced( + list.offsets().first().to_usize(), + list.offsets().range().to_usize(), + ); + let new_values = cast(sliced_values.as_ref(), inner.data_type(), options)?; + Ok(FixedSizeListArray::new( + DataType::FixedSizeList(Box::new(inner.clone()), size), + new_values, + list.validity().cloned(), + )) + }, + } +} + +/// Cast `array` to the provided data type and return a new [`Array`] with +/// type `to_type`, if possible. +/// +/// Behavior: +/// * PrimitiveArray to PrimitiveArray: overflowing cast will be None +/// * Boolean to Utf8: `true` => '1', `false` => `0` +/// * Utf8 to numeric: strings that can't be parsed to numbers return null, float strings +/// in integer casts return null +/// * Numeric to boolean: 0 returns `false`, any other value returns `true` +/// * List to List: the underlying data type is cast +/// * Fixed Size List to List: the underlying data type is cast +/// * List to Fixed Size List: the offsets are checked for valid order, then the +/// underlying type is cast. 
+/// * PrimitiveArray to List: a list array with 1 value per slot is created +/// * Date32 and Date64: precision lost when going to higher interval +/// * Time32 and Time64: precision lost when going to higher interval +/// * Timestamp and Date{32|64}: precision lost when going to higher interval +/// * Temporal to/from backing primitive: zero-copy with data type change +/// Unsupported Casts +/// * To or from `StructArray` +/// * List to primitive +/// * Utf8 to boolean +/// * Interval and duration +pub fn cast(array: &dyn Array, to_type: &DataType, options: CastOptions) -> Result> { + use DataType::*; + let from_type = array.data_type(); + + // clone array if types are the same + if from_type == to_type { + return Ok(clone(array)); + } + + let as_options = options.with_wrapped(true); + match (from_type, to_type) { + (Null, _) | (_, Null) => Ok(new_null_array(to_type.clone(), array.len())), + (Struct(_), _) => Err(Error::NotYetImplemented( + "Cannot cast from struct to other types".to_string(), + )), + (_, Struct(_)) => Err(Error::NotYetImplemented( + "Cannot cast to struct from other types".to_string(), + )), + (List(_), FixedSizeList(inner, size)) => cast_list_to_fixed_size_list::( + array.as_any().downcast_ref().unwrap(), + inner.as_ref(), + *size, + options, + ) + .map(|x| x.boxed()), + (LargeList(_), FixedSizeList(inner, size)) => cast_list_to_fixed_size_list::( + array.as_any().downcast_ref().unwrap(), + inner.as_ref(), + *size, + options, + ) + .map(|x| x.boxed()), + (FixedSizeList(_, _), List(_)) => cast_fixed_size_list_to_list::( + array.as_any().downcast_ref().unwrap(), + to_type, + options, + ) + .map(|x| x.boxed()), + (FixedSizeList(_, _), LargeList(_)) => cast_fixed_size_list_to_list::( + array.as_any().downcast_ref().unwrap(), + to_type, + options, + ) + .map(|x| x.boxed()), + (List(_), List(_)) => { + cast_list::(array.as_any().downcast_ref().unwrap(), to_type, options) + .map(|x| x.boxed()) + }, + (LargeList(_), LargeList(_)) => { + cast_list::(array.as_any().downcast_ref().unwrap(), to_type, options) + .map(|x| x.boxed()) + }, + (List(lhs), LargeList(rhs)) if lhs == rhs => { + Ok(cast_list_to_large_list(array.as_any().downcast_ref().unwrap(), to_type).boxed()) + }, + (LargeList(lhs), List(rhs)) if lhs == rhs => { + Ok(cast_large_to_list(array.as_any().downcast_ref().unwrap(), to_type).boxed()) + }, + + (_, List(to)) => { + // cast primitive to list's primitive + let values = cast(array, &to.data_type, options)?; + // create offsets, where if array.len() = 2, we have [0,1,2] + let offsets = (0..=array.len() as i32).collect::>(); + // Safety: offsets _are_ monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }; + + let list_array = ListArray::::new(to_type.clone(), offsets.into(), values, None); + + Ok(Box::new(list_array)) + }, + + (_, LargeList(to)) if from_type != &LargeBinary => { + // cast primitive to list's primitive + let values = cast(array, &to.data_type, options)?; + // create offsets, where if array.len() = 2, we have [0,1,2] + let offsets = (0..=array.len() as i64).collect::>(); + // Safety: offsets _are_ monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }; + + let list_array = ListArray::::new(to_type.clone(), offsets.into(), values, None); + + Ok(Box::new(list_array)) + }, + + (Dictionary(index_type, ..), _) => match_integer_type!(index_type, |$T| { + dictionary_cast_dyn::<$T>(array, to_type, options) + }), + (_, Dictionary(index_type, value_type, _)) => match_integer_type!(index_type, |$T| { + 
cast_to_dictionary::<$T>(array, value_type, options) + }), + (_, Boolean) => match from_type { + UInt8 => primitive_to_boolean_dyn::(array, to_type.clone()), + UInt16 => primitive_to_boolean_dyn::(array, to_type.clone()), + UInt32 => primitive_to_boolean_dyn::(array, to_type.clone()), + UInt64 => primitive_to_boolean_dyn::(array, to_type.clone()), + Int8 => primitive_to_boolean_dyn::(array, to_type.clone()), + Int16 => primitive_to_boolean_dyn::(array, to_type.clone()), + Int32 => primitive_to_boolean_dyn::(array, to_type.clone()), + Int64 => primitive_to_boolean_dyn::(array, to_type.clone()), + Float32 => primitive_to_boolean_dyn::(array, to_type.clone()), + Float64 => primitive_to_boolean_dyn::(array, to_type.clone()), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + (Boolean, _) => match to_type { + UInt8 => boolean_to_primitive_dyn::(array), + UInt16 => boolean_to_primitive_dyn::(array), + UInt32 => boolean_to_primitive_dyn::(array), + UInt64 => boolean_to_primitive_dyn::(array), + Int8 => boolean_to_primitive_dyn::(array), + Int16 => boolean_to_primitive_dyn::(array), + Int32 => boolean_to_primitive_dyn::(array), + Int64 => boolean_to_primitive_dyn::(array), + Float32 => boolean_to_primitive_dyn::(array), + Float64 => boolean_to_primitive_dyn::(array), + LargeUtf8 => boolean_to_utf8_dyn::(array), + LargeBinary => boolean_to_binary_dyn::(array), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (Utf8, _) => match to_type { + UInt8 => utf8_to_primitive_dyn::(array, to_type, options), + UInt16 => utf8_to_primitive_dyn::(array, to_type, options), + UInt32 => utf8_to_primitive_dyn::(array, to_type, options), + UInt64 => utf8_to_primitive_dyn::(array, to_type, options), + Int8 => utf8_to_primitive_dyn::(array, to_type, options), + Int16 => utf8_to_primitive_dyn::(array, to_type, options), + Int32 => utf8_to_primitive_dyn::(array, to_type, options), + Int64 => utf8_to_primitive_dyn::(array, to_type, options), + Float32 => utf8_to_primitive_dyn::(array, to_type, options), + Float64 => utf8_to_primitive_dyn::(array, to_type, options), + Date32 => utf8_to_date32_dyn::(array), + Date64 => utf8_to_date64_dyn::(array), + LargeUtf8 => Ok(Box::new(utf8_to_large_utf8( + array.as_any().downcast_ref().unwrap(), + ))), + Timestamp(TimeUnit::Nanosecond, None) => utf8_to_naive_timestamp_ns_dyn::(array), + Timestamp(TimeUnit::Nanosecond, Some(tz)) => { + utf8_to_timestamp_ns_dyn::(array, tz.clone()) + }, + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + (LargeUtf8, _) => match to_type { + UInt8 => utf8_to_primitive_dyn::(array, to_type, options), + UInt16 => utf8_to_primitive_dyn::(array, to_type, options), + UInt32 => utf8_to_primitive_dyn::(array, to_type, options), + UInt64 => utf8_to_primitive_dyn::(array, to_type, options), + Int8 => utf8_to_primitive_dyn::(array, to_type, options), + Int16 => utf8_to_primitive_dyn::(array, to_type, options), + Int32 => utf8_to_primitive_dyn::(array, to_type, options), + Int64 => utf8_to_primitive_dyn::(array, to_type, options), + Float32 => utf8_to_primitive_dyn::(array, to_type, options), + Float64 => utf8_to_primitive_dyn::(array, to_type, options), + Date32 => utf8_to_date32_dyn::(array), + Date64 => utf8_to_date64_dyn::(array), + Utf8 => utf8_large_to_utf8(array.as_any().downcast_ref().unwrap()).map(|x| x.boxed()), + LargeBinary => Ok(utf8_to_binary::( + 
array.as_any().downcast_ref().unwrap(), + to_type.clone(), + ) + .boxed()), + Timestamp(TimeUnit::Nanosecond, None) => utf8_to_naive_timestamp_ns_dyn::(array), + Timestamp(TimeUnit::Nanosecond, Some(tz)) => { + utf8_to_timestamp_ns_dyn::(array, tz.clone()) + }, + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (_, Utf8) => match from_type { + UInt8 => primitive_to_utf8_dyn::(array), + UInt16 => primitive_to_utf8_dyn::(array), + UInt32 => primitive_to_utf8_dyn::(array), + UInt64 => primitive_to_utf8_dyn::(array), + Int8 => primitive_to_utf8_dyn::(array), + Int16 => primitive_to_utf8_dyn::(array), + Int32 => primitive_to_utf8_dyn::(array), + Int64 => primitive_to_utf8_dyn::(array), + Float32 => primitive_to_utf8_dyn::(array), + Float64 => primitive_to_utf8_dyn::(array), + Timestamp(from_unit, Some(tz)) => { + let from = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(timestamp_to_utf8::(from, *from_unit, tz)?)) + }, + Timestamp(from_unit, None) => { + let from = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(naive_timestamp_to_utf8::(from, *from_unit))) + }, + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (_, LargeUtf8) => match from_type { + UInt8 => primitive_to_utf8_dyn::(array), + UInt16 => primitive_to_utf8_dyn::(array), + UInt32 => primitive_to_utf8_dyn::(array), + UInt64 => primitive_to_utf8_dyn::(array), + Int8 => primitive_to_utf8_dyn::(array), + Int16 => primitive_to_utf8_dyn::(array), + Int32 => primitive_to_utf8_dyn::(array), + Int64 => primitive_to_utf8_dyn::(array), + Float32 => primitive_to_utf8_dyn::(array), + Float64 => primitive_to_utf8_dyn::(array), + LargeBinary => { + binary_to_utf8::(array.as_any().downcast_ref().unwrap(), to_type.clone()) + .map(|x| x.boxed()) + }, + Timestamp(from_unit, Some(tz)) => { + let from = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(timestamp_to_utf8::(from, *from_unit, tz)?)) + }, + Timestamp(from_unit, None) => { + let from = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(naive_timestamp_to_utf8::(from, *from_unit))) + }, + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (Binary, _) => match to_type { + UInt8 => binary_to_primitive_dyn::(array, to_type, options), + UInt16 => binary_to_primitive_dyn::(array, to_type, options), + UInt32 => binary_to_primitive_dyn::(array, to_type, options), + UInt64 => binary_to_primitive_dyn::(array, to_type, options), + Int8 => binary_to_primitive_dyn::(array, to_type, options), + Int16 => binary_to_primitive_dyn::(array, to_type, options), + Int32 => binary_to_primitive_dyn::(array, to_type, options), + Int64 => binary_to_primitive_dyn::(array, to_type, options), + Float32 => binary_to_primitive_dyn::(array, to_type, options), + Float64 => binary_to_primitive_dyn::(array, to_type, options), + LargeBinary => Ok(Box::new(binary_to_large_binary( + array.as_any().downcast_ref().unwrap(), + to_type.clone(), + ))), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (LargeBinary, _) => { + match to_type { + UInt8 => binary_to_primitive_dyn::(array, to_type, options), + UInt16 => binary_to_primitive_dyn::(array, to_type, options), + UInt32 => binary_to_primitive_dyn::(array, to_type, options), + UInt64 => binary_to_primitive_dyn::(array, to_type, options), + Int8 => binary_to_primitive_dyn::(array, 
to_type, options), + Int16 => binary_to_primitive_dyn::(array, to_type, options), + Int32 => binary_to_primitive_dyn::(array, to_type, options), + Int64 => binary_to_primitive_dyn::(array, to_type, options), + Float32 => binary_to_primitive_dyn::(array, to_type, options), + Float64 => binary_to_primitive_dyn::(array, to_type, options), + Binary => { + binary_large_to_binary(array.as_any().downcast_ref().unwrap(), to_type.clone()) + .map(|x| x.boxed()) + }, + LargeUtf8 => { + binary_to_utf8::(array.as_any().downcast_ref().unwrap(), to_type.clone()) + .map(|x| x.boxed()) + }, + LargeList(inner) if matches!(inner.data_type, DataType::UInt8) => Ok( + binary_to_list::(array.as_any().downcast_ref().unwrap(), to_type.clone()) + .boxed(), + ), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + } + }, + (FixedSizeBinary(_), _) => match to_type { + Binary => Ok(fixed_size_binary_binary::( + array.as_any().downcast_ref().unwrap(), + to_type.clone(), + ) + .boxed()), + LargeBinary => Ok(fixed_size_binary_binary::( + array.as_any().downcast_ref().unwrap(), + to_type.clone(), + ) + .boxed()), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (_, Binary) => match from_type { + UInt8 => primitive_to_binary_dyn::(array), + UInt16 => primitive_to_binary_dyn::(array), + UInt32 => primitive_to_binary_dyn::(array), + UInt64 => primitive_to_binary_dyn::(array), + Int8 => primitive_to_binary_dyn::(array), + Int16 => primitive_to_binary_dyn::(array), + Int32 => primitive_to_binary_dyn::(array), + Int64 => primitive_to_binary_dyn::(array), + Float32 => primitive_to_binary_dyn::(array), + Float64 => primitive_to_binary_dyn::(array), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + (_, LargeBinary) => match from_type { + UInt8 => primitive_to_binary_dyn::(array), + UInt16 => primitive_to_binary_dyn::(array), + UInt32 => primitive_to_binary_dyn::(array), + UInt64 => primitive_to_binary_dyn::(array), + Int8 => primitive_to_binary_dyn::(array), + Int16 => primitive_to_binary_dyn::(array), + Int32 => primitive_to_binary_dyn::(array), + Int64 => primitive_to_binary_dyn::(array), + Float32 => primitive_to_binary_dyn::(array), + Float64 => primitive_to_binary_dyn::(array), + _ => Err(Error::NotYetImplemented(format!( + "Casting from {from_type:?} to {to_type:?} not supported", + ))), + }, + + // start numeric casts + (UInt8, UInt16) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt8, UInt32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt8, UInt64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt8, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt8, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt8, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt8, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt8, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt8, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt8, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (UInt16, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt16, UInt32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt16, UInt64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt16, Int8) => 
primitive_to_primitive_dyn::(array, to_type, options), + (UInt16, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt16, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt16, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt16, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt16, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt16, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (UInt32, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, UInt64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt32, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt32, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt32, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt32, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (UInt64, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (UInt64, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt64, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (UInt64, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (Int8, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int8, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int8, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int8, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Int8, Int16) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int8, Int32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int8, Int64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int8, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int8, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int8, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (Int16, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int16, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int16, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int16, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Int16, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int16, Int32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int16, Int64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int16, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int16, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int16, Decimal(p, s)) => 
integer_to_decimal_dyn::(array, *p, *s), + + (Int32, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int32, Int64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int32, Float32) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int32, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int32, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (Int64, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, Float32) => primitive_to_primitive_dyn::(array, to_type, options), + (Int64, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Int64, Decimal(p, s)) => integer_to_decimal_dyn::(array, *p, *s), + + (Float16, Float32) => { + let from = array.as_any().downcast_ref().unwrap(); + Ok(f16_to_f32(from).boxed()) + }, + + (Float32, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (Float32, Float64) => primitive_to_primitive_dyn::(array, to_type, as_options), + (Float32, Decimal(p, s)) => float_to_decimal_dyn::(array, *p, *s), + + (Float64, UInt8) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, UInt16) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, UInt32) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, UInt64) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Int8) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Int16) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Int32) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Int64) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Float32) => primitive_to_primitive_dyn::(array, to_type, options), + (Float64, Decimal(p, s)) => float_to_decimal_dyn::(array, *p, *s), + + (Decimal(_, _), UInt8) => decimal_to_integer_dyn::(array), + (Decimal(_, _), UInt16) => decimal_to_integer_dyn::(array), + (Decimal(_, _), UInt32) => decimal_to_integer_dyn::(array), + (Decimal(_, _), UInt64) => decimal_to_integer_dyn::(array), + (Decimal(_, _), Int8) => decimal_to_integer_dyn::(array), + (Decimal(_, _), Int16) => 
decimal_to_integer_dyn::<i16>(array),
+        (Decimal(_, _), Int32) => decimal_to_integer_dyn::<i32>(array),
+        (Decimal(_, _), Int64) => decimal_to_integer_dyn::<i64>(array),
+        (Decimal(_, _), Float32) => decimal_to_float_dyn::<f32>(array),
+        (Decimal(_, _), Float64) => decimal_to_float_dyn::<f64>(array),
+        (Decimal(_, _), Decimal(to_p, to_s)) => decimal_to_decimal_dyn(array, *to_p, *to_s),
+        // end numeric casts
+
+        // temporal casts
+        (Int32, Date32) => primitive_to_same_primitive_dyn::<i32>(array, to_type),
+        (Int32, Time32(TimeUnit::Second)) => primitive_to_same_primitive_dyn::<i32>(array, to_type),
+        (Int32, Time32(TimeUnit::Millisecond)) => {
+            primitive_to_same_primitive_dyn::<i32>(array, to_type)
+        },
+        // No support for microsecond/nanosecond with i32
+        (Date32, Int32) => primitive_to_same_primitive_dyn::<i32>(array, to_type),
+        (Date32, Int64) => primitive_to_primitive_dyn::<i32, i64>(array, to_type, options),
+        (Time32(_), Int32) => primitive_to_same_primitive_dyn::<i32>(array, to_type),
+        (Int64, Date64) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        // No support for second/milliseconds with i64
+        (Int64, Time64(TimeUnit::Microsecond)) => {
+            primitive_to_same_primitive_dyn::<i64>(array, to_type)
+        },
+        (Int64, Time64(TimeUnit::Nanosecond)) => {
+            primitive_to_same_primitive_dyn::<i64>(array, to_type)
+        },
+
+        (Date64, Int32) => primitive_to_primitive_dyn::<i64, i32>(array, to_type, options),
+        (Date64, Int64) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        (Time64(_), Int64) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        (Date32, Date64) => primitive_dyn!(array, date32_to_date64),
+        (Date64, Date32) => primitive_dyn!(array, date64_to_date32),
+        (Time32(TimeUnit::Second), Time32(TimeUnit::Millisecond)) => {
+            primitive_dyn!(array, time32s_to_time32ms)
+        },
+        (Time32(TimeUnit::Millisecond), Time32(TimeUnit::Second)) => {
+            primitive_dyn!(array, time32ms_to_time32s)
+        },
+        (Time32(from_unit), Time64(to_unit)) => {
+            primitive_dyn!(array, time32_to_time64, *from_unit, *to_unit)
+        },
+        (Time64(TimeUnit::Microsecond), Time64(TimeUnit::Nanosecond)) => {
+            primitive_dyn!(array, time64us_to_time64ns)
+        },
+        (Time64(TimeUnit::Nanosecond), Time64(TimeUnit::Microsecond)) => {
+            primitive_dyn!(array, time64ns_to_time64us)
+        },
+        (Time64(from_unit), Time32(to_unit)) => {
+            primitive_dyn!(array, time64_to_time32, *from_unit, *to_unit)
+        },
+        (Timestamp(_, _), Int64) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        (Int64, Timestamp(_, _)) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        (Timestamp(from_unit, _), Timestamp(to_unit, tz)) => {
+            primitive_dyn!(array, timestamp_to_timestamp, *from_unit, *to_unit, tz)
+        },
+        (Timestamp(from_unit, _), Date32) => primitive_dyn!(array, timestamp_to_date32, *from_unit),
+        (Timestamp(from_unit, _), Date64) => primitive_dyn!(array, timestamp_to_date64, *from_unit),
+
+        (Int64, Duration(_)) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+        (Duration(_), Int64) => primitive_to_same_primitive_dyn::<i64>(array, to_type),
+
+        (Interval(IntervalUnit::DayTime), Interval(IntervalUnit::MonthDayNano)) => {
+            primitive_dyn!(array, days_ms_to_months_days_ns)
+        },
+        (Interval(IntervalUnit::YearMonth), Interval(IntervalUnit::MonthDayNano)) => {
+            primitive_dyn!(array, months_to_months_days_ns)
+        },
+
+        (_, _) => Err(Error::NotYetImplemented(format!(
+            "Casting from {from_type:?} to {to_type:?} not supported",
+        ))),
+    }
+}
+
+/// Attempts to encode an array into a [`DictionaryArray`] with index type `K` and
+/// value (dictionary) type `dict_value_type`.
+///
+/// `K` is the key type.
+fn cast_to_dictionary<K: DictionaryKey>(
+    array: &dyn 
Array, + dict_value_type: &DataType, + options: CastOptions, +) -> Result> { + let array = cast(array, dict_value_type, options)?; + let array = array.as_ref(); + match *dict_value_type { + DataType::Int8 => primitive_to_dictionary_dyn::(array), + DataType::Int16 => primitive_to_dictionary_dyn::(array), + DataType::Int32 => primitive_to_dictionary_dyn::(array), + DataType::Int64 => primitive_to_dictionary_dyn::(array), + DataType::UInt8 => primitive_to_dictionary_dyn::(array), + DataType::UInt16 => primitive_to_dictionary_dyn::(array), + DataType::UInt32 => primitive_to_dictionary_dyn::(array), + DataType::UInt64 => primitive_to_dictionary_dyn::(array), + DataType::Utf8 => utf8_to_dictionary_dyn::(array), + DataType::LargeUtf8 => utf8_to_dictionary_dyn::(array), + DataType::Binary => binary_to_dictionary_dyn::(array), + DataType::LargeBinary => binary_to_dictionary_dyn::(array), + _ => Err(Error::NotYetImplemented(format!( + "Unsupported output type for dictionary packing: {dict_value_type:?}" + ))), + } +} diff --git a/crates/nano-arrow/src/compute/cast/primitive_to.rs b/crates/nano-arrow/src/compute/cast/primitive_to.rs new file mode 100644 index 000000000000..a83569ee165c --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/primitive_to.rs @@ -0,0 +1,584 @@ +use std::hash::Hash; + +use num_traits::{AsPrimitive, Float, ToPrimitive}; + +use super::CastOptions; +use crate::array::*; +use crate::bitmap::Bitmap; +use crate::compute::arity::unary; +use crate::datatypes::{DataType, IntervalUnit, TimeUnit}; +use crate::error::Result; +use crate::offset::{Offset, Offsets}; +use crate::temporal_conversions::*; +use crate::types::{days_ms, f16, months_days_ns, NativeType}; + +/// Returns a [`BinaryArray`] where every element is the binary representation of the number. +pub fn primitive_to_binary( + from: &PrimitiveArray, +) -> BinaryArray { + let mut values: Vec = Vec::with_capacity(from.len()); + let mut offsets: Vec = Vec::with_capacity(from.len() + 1); + offsets.push(O::default()); + + let mut offset: usize = 0; + + unsafe { + for x in from.values().iter() { + values.reserve(offset + T::FORMATTED_SIZE_DECIMAL); + + let bytes = std::slice::from_raw_parts_mut( + values.as_mut_ptr().add(offset), + values.capacity() - offset, + ); + let len = lexical_core::write_unchecked(*x, bytes).len(); + + offset += len; + offsets.push(O::from_usize(offset).unwrap()); + } + values.set_len(offset); + values.shrink_to_fit(); + // Safety: offsets _are_ monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }; + BinaryArray::::new( + BinaryArray::::default_data_type(), + offsets.into(), + values.into(), + from.validity().cloned(), + ) + } +} + +pub(super) fn primitive_to_binary_dyn(from: &dyn Array) -> Result> +where + O: Offset, + T: NativeType + lexical_core::ToLexical, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(primitive_to_binary::(from))) +} + +/// Returns a [`BooleanArray`] where every element is different from zero. +/// Validity is preserved. 
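// Illustrative usage sketch of `primitive_to_binary` above (assumes the `Int32Array`
// alias from `crate::array`; the offset type is annotated rather than guessing the
// exact generic parameter order):
fn primitive_to_binary_example() {
    use crate::array::{Array, BinaryArray, Int32Array};
    let ints = Int32Array::from([Some(12), None, Some(-7)]);
    // Each value becomes its decimal byte representation; the validity is carried over.
    let bytes: BinaryArray<i32> = primitive_to_binary(&ints);
    assert_eq!(bytes.value(0), "12".as_bytes());
    assert!(!bytes.is_valid(1));
    assert_eq!(bytes.value(2), "-7".as_bytes());
}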
+pub fn primitive_to_boolean( + from: &PrimitiveArray, + to_type: DataType, +) -> BooleanArray { + let iter = from.values().iter().map(|v| *v != T::default()); + let values = Bitmap::from_trusted_len_iter(iter); + + BooleanArray::new(to_type, values, from.validity().cloned()) +} + +pub(super) fn primitive_to_boolean_dyn( + from: &dyn Array, + to_type: DataType, +) -> Result> +where + T: NativeType, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(primitive_to_boolean::(from, to_type))) +} + +/// Returns a [`Utf8Array`] where every element is the utf8 representation of the number. +pub fn primitive_to_utf8( + from: &PrimitiveArray, +) -> Utf8Array { + let mut values: Vec = Vec::with_capacity(from.len()); + let mut offsets: Vec = Vec::with_capacity(from.len() + 1); + offsets.push(O::default()); + + let mut offset: usize = 0; + + unsafe { + for x in from.values().iter() { + values.reserve(offset + T::FORMATTED_SIZE_DECIMAL); + + let bytes = std::slice::from_raw_parts_mut( + values.as_mut_ptr().add(offset), + values.capacity() - offset, + ); + let len = lexical_core::write_unchecked(*x, bytes).len(); + + offset += len; + offsets.push(O::from_usize(offset).unwrap()); + } + values.set_len(offset); + values.shrink_to_fit(); + // Safety: offsets _are_ monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }; + Utf8Array::::new_unchecked( + Utf8Array::::default_data_type(), + offsets.into(), + values.into(), + from.validity().cloned(), + ) + } +} + +pub(super) fn primitive_to_utf8_dyn(from: &dyn Array) -> Result> +where + O: Offset, + T: NativeType + lexical_core::ToLexical, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(primitive_to_utf8::(from))) +} + +pub(super) fn primitive_to_primitive_dyn( + from: &dyn Array, + to_type: &DataType, + options: CastOptions, +) -> Result> +where + I: NativeType + num_traits::NumCast + num_traits::AsPrimitive, + O: NativeType + num_traits::NumCast, +{ + let from = from.as_any().downcast_ref::>().unwrap(); + if options.wrapped { + Ok(Box::new(primitive_as_primitive::(from, to_type))) + } else { + Ok(Box::new(primitive_to_primitive::(from, to_type))) + } +} + +/// Cast [`PrimitiveArray`] to a [`PrimitiveArray`] of another physical type via numeric conversion. +pub fn primitive_to_primitive( + from: &PrimitiveArray, + to_type: &DataType, +) -> PrimitiveArray +where + I: NativeType + num_traits::NumCast, + O: NativeType + num_traits::NumCast, +{ + let iter = from + .iter() + .map(|v| v.and_then(|x| num_traits::cast::cast::(*x))); + PrimitiveArray::::from_trusted_len_iter(iter).to(to_type.clone()) +} + +/// Returns a [`PrimitiveArray`] with the casted values. 
Values are `None` on overflow +pub fn integer_to_decimal>( + from: &PrimitiveArray, + to_precision: usize, + to_scale: usize, +) -> PrimitiveArray { + let multiplier = 10_i128.pow(to_scale as u32); + + let min_for_precision = 9_i128 + .saturating_pow(1 + to_precision as u32) + .saturating_neg(); + let max_for_precision = 9_i128.saturating_pow(1 + to_precision as u32); + + let values = from.iter().map(|x| { + x.and_then(|x| { + x.as_().checked_mul(multiplier).and_then(|x| { + if x > max_for_precision || x < min_for_precision { + None + } else { + Some(x) + } + }) + }) + }); + + PrimitiveArray::::from_trusted_len_iter(values) + .to(DataType::Decimal(to_precision, to_scale)) +} + +pub(super) fn integer_to_decimal_dyn( + from: &dyn Array, + precision: usize, + scale: usize, +) -> Result> +where + T: NativeType + AsPrimitive, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(integer_to_decimal::(from, precision, scale))) +} + +/// Returns a [`PrimitiveArray`] with the casted values. Values are `None` on overflow +pub fn float_to_decimal( + from: &PrimitiveArray, + to_precision: usize, + to_scale: usize, +) -> PrimitiveArray +where + T: NativeType + Float + ToPrimitive, + f64: AsPrimitive, +{ + // 1.2 => 12 + let multiplier: T = (10_f64).powi(to_scale as i32).as_(); + + let min_for_precision = 9_i128 + .saturating_pow(1 + to_precision as u32) + .saturating_neg(); + let max_for_precision = 9_i128.saturating_pow(1 + to_precision as u32); + + let values = from.iter().map(|x| { + x.and_then(|x| { + let x = (*x * multiplier).to_i128().unwrap(); + if x > max_for_precision || x < min_for_precision { + None + } else { + Some(x) + } + }) + }); + + PrimitiveArray::::from_trusted_len_iter(values) + .to(DataType::Decimal(to_precision, to_scale)) +} + +pub(super) fn float_to_decimal_dyn( + from: &dyn Array, + precision: usize, + scale: usize, +) -> Result> +where + T: NativeType + Float + ToPrimitive, + f64: AsPrimitive, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(float_to_decimal::(from, precision, scale))) +} + +/// Cast [`PrimitiveArray`] as a [`PrimitiveArray`] +/// Same as `number as to_number_type` in rust +pub fn primitive_as_primitive( + from: &PrimitiveArray, + to_type: &DataType, +) -> PrimitiveArray +where + I: NativeType + num_traits::AsPrimitive, + O: NativeType, +{ + unary(from, num_traits::AsPrimitive::::as_, to_type.clone()) +} + +/// Cast [`PrimitiveArray`] to a [`PrimitiveArray`] of the same physical type. +/// This is O(1). +pub fn primitive_to_same_primitive( + from: &PrimitiveArray, + to_type: &DataType, +) -> PrimitiveArray +where + T: NativeType, +{ + PrimitiveArray::::new( + to_type.clone(), + from.values().clone(), + from.validity().cloned(), + ) +} + +/// Cast [`PrimitiveArray`] to a [`PrimitiveArray`] of the same physical type. +/// This is O(1). +pub(super) fn primitive_to_same_primitive_dyn( + from: &dyn Array, + to_type: &DataType, +) -> Result> +where + T: NativeType, +{ + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(primitive_to_same_primitive::(from, to_type))) +} + +pub(super) fn primitive_to_dictionary_dyn( + from: &dyn Array, +) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + primitive_to_dictionary::(from).map(|x| Box::new(x) as Box) +} + +/// Cast [`PrimitiveArray`] to [`DictionaryArray`]. Also known as packing. +/// # Errors +/// This function errors if the maximum key is smaller than the number of distinct elements +/// in the array. 
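// Worked sketch of the integer-to-decimal cast above: each value is scaled by
// 10^scale and anything that no longer fits the target precision becomes null
// (assumes the `Int32Array` alias; the precision/scale pair is arbitrary here).
fn integer_to_decimal_example() {
    use crate::array::{Array, Int32Array};
    let ints = Int32Array::from([Some(42), None, Some(i32::MAX)]);
    let decimals = integer_to_decimal(&ints, 5, 2); // Decimal(precision: 5, scale: 2)
    assert_eq!(decimals.value(0), 4200); // 42 * 10^2
    assert!(!decimals.is_valid(1)); // null stays null
    assert!(!decimals.is_valid(2)); // does not fit precision 5, becomes null
}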
+pub fn primitive_to_dictionary( + from: &PrimitiveArray, +) -> Result> { + let iter = from.iter().map(|x| x.copied()); + let mut array = MutableDictionaryArray::::try_empty(MutablePrimitiveArray::::from( + from.data_type().clone(), + ))?; + array.try_extend(iter)?; + + Ok(array.into()) +} + +/// Get the time unit as a multiple of a second +const fn time_unit_multiple(unit: TimeUnit) -> i64 { + match unit { + TimeUnit::Second => 1, + TimeUnit::Millisecond => MILLISECONDS, + TimeUnit::Microsecond => MICROSECONDS, + TimeUnit::Nanosecond => NANOSECONDS, + } +} + +/// Conversion of dates +pub fn date32_to_date64(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x as i64 * MILLISECONDS_IN_DAY, DataType::Date64) +} + +/// Conversion of dates +pub fn date64_to_date32(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| (x / MILLISECONDS_IN_DAY) as i32, DataType::Date32) +} + +/// Conversion of times +pub fn time32s_to_time32ms(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x * 1000, DataType::Time32(TimeUnit::Millisecond)) +} + +/// Conversion of times +pub fn time32ms_to_time32s(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x / 1000, DataType::Time32(TimeUnit::Second)) +} + +/// Conversion of times +pub fn time64us_to_time64ns(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x * 1000, DataType::Time64(TimeUnit::Nanosecond)) +} + +/// Conversion of times +pub fn time64ns_to_time64us(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x / 1000, DataType::Time64(TimeUnit::Microsecond)) +} + +/// Conversion of timestamp +pub fn timestamp_to_date64(from: &PrimitiveArray, from_unit: TimeUnit) -> PrimitiveArray { + let from_size = time_unit_multiple(from_unit); + let to_size = MILLISECONDS; + let to_type = DataType::Date64; + + // Scale time_array by (to_size / from_size) using a + // single integer operation, but need to avoid integer + // math rounding down to zero + + match to_size.cmp(&from_size) { + std::cmp::Ordering::Less => unary(from, |x| (x / (from_size / to_size)), to_type), + std::cmp::Ordering::Equal => primitive_to_same_primitive(from, &to_type), + std::cmp::Ordering::Greater => unary(from, |x| (x * (to_size / from_size)), to_type), + } +} + +/// Conversion of timestamp +pub fn timestamp_to_date32(from: &PrimitiveArray, from_unit: TimeUnit) -> PrimitiveArray { + let from_size = time_unit_multiple(from_unit) * SECONDS_IN_DAY; + unary(from, |x| (x / from_size) as i32, DataType::Date32) +} + +/// Conversion of time +pub fn time32_to_time64( + from: &PrimitiveArray, + from_unit: TimeUnit, + to_unit: TimeUnit, +) -> PrimitiveArray { + let from_size = time_unit_multiple(from_unit); + let to_size = time_unit_multiple(to_unit); + let divisor = to_size / from_size; + unary(from, |x| (x as i64 * divisor), DataType::Time64(to_unit)) +} + +/// Conversion of time +pub fn time64_to_time32( + from: &PrimitiveArray, + from_unit: TimeUnit, + to_unit: TimeUnit, +) -> PrimitiveArray { + let from_size = time_unit_multiple(from_unit); + let to_size = time_unit_multiple(to_unit); + let divisor = from_size / to_size; + unary(from, |x| (x / divisor) as i32, DataType::Time32(to_unit)) +} + +/// Conversion of timestamp +pub fn timestamp_to_timestamp( + from: &PrimitiveArray, + from_unit: TimeUnit, + to_unit: TimeUnit, + tz: &Option, +) -> PrimitiveArray { + let from_size = time_unit_multiple(from_unit); + let to_size = time_unit_multiple(to_unit); + let to_type = DataType::Timestamp(to_unit, tz.clone()); + // we either divide or multiply, 
depending on size of each unit + if from_size >= to_size { + unary(from, |x| (x / (from_size / to_size)), to_type) + } else { + unary(from, |x| (x * (to_size / from_size)), to_type) + } +} + +fn timestamp_to_utf8_impl( + from: &PrimitiveArray, + time_unit: TimeUnit, + timezone: T, +) -> Utf8Array +where + T::Offset: std::fmt::Display, +{ + match time_unit { + TimeUnit::Nanosecond => { + let iter = from.iter().map(|x| { + x.map(|x| { + let datetime = timestamp_ns_to_datetime(*x); + let offset = timezone.offset_from_utc_datetime(&datetime); + chrono::DateTime::::from_naive_utc_and_offset(datetime, offset).to_rfc3339() + }) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Microsecond => { + let iter = from.iter().map(|x| { + x.map(|x| { + let datetime = timestamp_us_to_datetime(*x); + let offset = timezone.offset_from_utc_datetime(&datetime); + chrono::DateTime::::from_naive_utc_and_offset(datetime, offset).to_rfc3339() + }) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Millisecond => { + let iter = from.iter().map(|x| { + x.map(|x| { + let datetime = timestamp_ms_to_datetime(*x); + let offset = timezone.offset_from_utc_datetime(&datetime); + chrono::DateTime::::from_naive_utc_and_offset(datetime, offset).to_rfc3339() + }) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Second => { + let iter = from.iter().map(|x| { + x.map(|x| { + let datetime = timestamp_s_to_datetime(*x); + let offset = timezone.offset_from_utc_datetime(&datetime); + chrono::DateTime::::from_naive_utc_and_offset(datetime, offset).to_rfc3339() + }) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + } +} + +#[cfg(feature = "chrono-tz")] +#[cfg_attr(docsrs, doc(cfg(feature = "chrono-tz")))] +fn chrono_tz_timestamp_to_utf8( + from: &PrimitiveArray, + time_unit: TimeUnit, + timezone_str: &str, +) -> Result> { + let timezone = parse_offset_tz(timezone_str)?; + Ok(timestamp_to_utf8_impl::( + from, time_unit, timezone, + )) +} + +#[cfg(not(feature = "chrono-tz"))] +fn chrono_tz_timestamp_to_utf8( + _: &PrimitiveArray, + _: TimeUnit, + timezone_str: &str, +) -> Result> { + use crate::error::Error; + Err(Error::InvalidArgumentError(format!( + "timezone \"{}\" cannot be parsed (feature chrono-tz is not active)", + timezone_str + ))) +} + +/// Returns a [`Utf8Array`] where every element is the utf8 representation of the timestamp in the rfc3339 format. +pub fn timestamp_to_utf8( + from: &PrimitiveArray, + time_unit: TimeUnit, + timezone_str: &str, +) -> Result> { + let timezone = parse_offset(timezone_str); + + if let Ok(timezone) = timezone { + Ok(timestamp_to_utf8_impl::( + from, time_unit, timezone, + )) + } else { + chrono_tz_timestamp_to_utf8(from, time_unit, timezone_str) + } +} + +/// Returns a [`Utf8Array`] where every element is the utf8 representation of the timestamp in the rfc3339 format. 
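// Sketch of the unit-scaling rule implemented by `timestamp_to_timestamp` above:
// converting to a finer unit multiplies, converting to a coarser unit divides
// (integer division). Assumes the `Int64Array` alias and `PrimitiveArray::to` for
// attaching the logical timestamp type.
fn timestamp_rescale_example() {
    use crate::array::{Array, Int64Array};
    use crate::datatypes::{DataType, TimeUnit};
    let seconds = Int64Array::from([Some(1_500_000_000i64), None])
        .to(DataType::Timestamp(TimeUnit::Second, None));
    let millis = timestamp_to_timestamp(&seconds, TimeUnit::Second, TimeUnit::Millisecond, &None);
    assert_eq!(millis.value(0), 1_500_000_000_000); // seconds -> milliseconds: * 1000
    assert!(!millis.is_valid(1));
}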
+pub fn naive_timestamp_to_utf8( + from: &PrimitiveArray, + time_unit: TimeUnit, +) -> Utf8Array { + match time_unit { + TimeUnit::Nanosecond => { + let iter = from.iter().map(|x| { + x.copied() + .map(timestamp_ns_to_datetime) + .map(|x| x.to_string()) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Microsecond => { + let iter = from.iter().map(|x| { + x.copied() + .map(timestamp_us_to_datetime) + .map(|x| x.to_string()) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Millisecond => { + let iter = from.iter().map(|x| { + x.copied() + .map(timestamp_ms_to_datetime) + .map(|x| x.to_string()) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + TimeUnit::Second => { + let iter = from.iter().map(|x| { + x.copied() + .map(timestamp_s_to_datetime) + .map(|x| x.to_string()) + }); + Utf8Array::from_trusted_len_iter(iter) + }, + } +} + +#[inline] +fn days_ms_to_months_days_ns_scalar(from: days_ms) -> months_days_ns { + months_days_ns::new(0, from.days(), from.milliseconds() as i64 * 1000) +} + +/// Casts [`days_ms`]s to [`months_days_ns`]. This operation is infalible and lossless. +pub fn days_ms_to_months_days_ns(from: &PrimitiveArray) -> PrimitiveArray { + unary( + from, + days_ms_to_months_days_ns_scalar, + DataType::Interval(IntervalUnit::MonthDayNano), + ) +} + +#[inline] +fn months_to_months_days_ns_scalar(from: i32) -> months_days_ns { + months_days_ns::new(from, 0, 0) +} + +/// Casts months represented as [`i32`]s to [`months_days_ns`]. This operation is infalible and lossless. +pub fn months_to_months_days_ns(from: &PrimitiveArray) -> PrimitiveArray { + unary( + from, + months_to_months_days_ns_scalar, + DataType::Interval(IntervalUnit::MonthDayNano), + ) +} + +/// Casts f16 into f32 +pub fn f16_to_f32(from: &PrimitiveArray) -> PrimitiveArray { + unary(from, |x| x.to_f32(), DataType::Float32) +} diff --git a/crates/nano-arrow/src/compute/cast/utf8_to.rs b/crates/nano-arrow/src/compute/cast/utf8_to.rs new file mode 100644 index 000000000000..9c86ff85da54 --- /dev/null +++ b/crates/nano-arrow/src/compute/cast/utf8_to.rs @@ -0,0 +1,176 @@ +use chrono::Datelike; + +use super::CastOptions; +use crate::array::*; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::offset::Offset; +use crate::temporal_conversions::{ + utf8_to_naive_timestamp_ns as utf8_to_naive_timestamp_ns_, + utf8_to_timestamp_ns as utf8_to_timestamp_ns_, EPOCH_DAYS_FROM_CE, +}; +use crate::types::NativeType; + +const RFC3339: &str = "%Y-%m-%dT%H:%M:%S%.f%:z"; + +/// Casts a [`Utf8Array`] to a [`PrimitiveArray`], making any uncastable value a Null. +pub fn utf8_to_primitive(from: &Utf8Array, to: &DataType) -> PrimitiveArray +where + T: NativeType + lexical_core::FromLexical, +{ + let iter = from + .iter() + .map(|x| x.and_then::(|x| lexical_core::parse(x.as_bytes()).ok())); + + PrimitiveArray::::from_trusted_len_iter(iter).to(to.clone()) +} + +/// Casts a [`Utf8Array`] to a [`PrimitiveArray`] at best-effort using `lexical_core::parse_partial`, making any uncastable value as zero. 
+pub fn partial_utf8_to_primitive( + from: &Utf8Array, + to: &DataType, +) -> PrimitiveArray +where + T: NativeType + lexical_core::FromLexical, +{ + let iter = from.iter().map(|x| { + x.and_then::(|x| lexical_core::parse_partial(x.as_bytes()).ok().map(|x| x.0)) + }); + + PrimitiveArray::::from_trusted_len_iter(iter).to(to.clone()) +} + +pub(super) fn utf8_to_primitive_dyn( + from: &dyn Array, + to: &DataType, + options: CastOptions, +) -> Result> +where + T: NativeType + lexical_core::FromLexical, +{ + let from = from.as_any().downcast_ref().unwrap(); + if options.partial { + Ok(Box::new(partial_utf8_to_primitive::(from, to))) + } else { + Ok(Box::new(utf8_to_primitive::(from, to))) + } +} + +/// Casts a [`Utf8Array`] to a Date32 primitive, making any uncastable value a Null. +pub fn utf8_to_date32(from: &Utf8Array) -> PrimitiveArray { + let iter = from.iter().map(|x| { + x.and_then(|x| { + x.parse::() + .ok() + .map(|x| x.num_days_from_ce() - EPOCH_DAYS_FROM_CE) + }) + }); + PrimitiveArray::::from_trusted_len_iter(iter).to(DataType::Date32) +} + +pub(super) fn utf8_to_date32_dyn(from: &dyn Array) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(utf8_to_date32::(from))) +} + +/// Casts a [`Utf8Array`] to a Date64 primitive, making any uncastable value a Null. +pub fn utf8_to_date64(from: &Utf8Array) -> PrimitiveArray { + let iter = from.iter().map(|x| { + x.and_then(|x| { + x.parse::() + .ok() + .map(|x| (x.num_days_from_ce() - EPOCH_DAYS_FROM_CE) as i64 * 86400000) + }) + }); + PrimitiveArray::from_trusted_len_iter(iter).to(DataType::Date64) +} + +pub(super) fn utf8_to_date64_dyn(from: &dyn Array) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(utf8_to_date64::(from))) +} + +pub(super) fn utf8_to_dictionary_dyn( + from: &dyn Array, +) -> Result> { + let values = from.as_any().downcast_ref().unwrap(); + utf8_to_dictionary::(values).map(|x| Box::new(x) as Box) +} + +/// Cast [`Utf8Array`] to [`DictionaryArray`], also known as packing. +/// # Errors +/// This function errors if the maximum key is smaller than the number of distinct elements +/// in the array. 
+pub fn utf8_to_dictionary( + from: &Utf8Array, +) -> Result> { + let mut array = MutableDictionaryArray::>::new(); + array.try_extend(from.iter())?; + + Ok(array.into()) +} + +pub(super) fn utf8_to_naive_timestamp_ns_dyn( + from: &dyn Array, +) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + Ok(Box::new(utf8_to_naive_timestamp_ns::(from))) +} + +/// [`crate::temporal_conversions::utf8_to_timestamp_ns`] applied for RFC3339 formatting +pub fn utf8_to_naive_timestamp_ns(from: &Utf8Array) -> PrimitiveArray { + utf8_to_naive_timestamp_ns_(from, RFC3339) +} + +pub(super) fn utf8_to_timestamp_ns_dyn( + from: &dyn Array, + timezone: String, +) -> Result> { + let from = from.as_any().downcast_ref().unwrap(); + utf8_to_timestamp_ns::(from, timezone) + .map(Box::new) + .map(|x| x as Box) +} + +/// [`crate::temporal_conversions::utf8_to_timestamp_ns`] applied for RFC3339 formatting +pub fn utf8_to_timestamp_ns( + from: &Utf8Array, + timezone: String, +) -> Result> { + utf8_to_timestamp_ns_(from, RFC3339, timezone) +} + +/// Conversion of utf8 +pub fn utf8_to_large_utf8(from: &Utf8Array) -> Utf8Array { + let data_type = Utf8Array::::default_data_type(); + let validity = from.validity().cloned(); + let values = from.values().clone(); + + let offsets = from.offsets().into(); + // Safety: sound because `values` fulfills the same invariants as `from.values()` + unsafe { Utf8Array::::new_unchecked(data_type, offsets, values, validity) } +} + +/// Conversion of utf8 +pub fn utf8_large_to_utf8(from: &Utf8Array) -> Result> { + let data_type = Utf8Array::::default_data_type(); + let validity = from.validity().cloned(); + let values = from.values().clone(); + let offsets = from.offsets().try_into()?; + + // Safety: sound because `values` fulfills the same invariants as `from.values()` + Ok(unsafe { Utf8Array::::new_unchecked(data_type, offsets, values, validity) }) +} + +/// Conversion to binary +pub fn utf8_to_binary(from: &Utf8Array, to_data_type: DataType) -> BinaryArray { + // Safety: erasure of an invariant is always safe + unsafe { + BinaryArray::::new( + to_data_type, + from.offsets().clone(), + from.values().clone(), + from.validity().cloned(), + ) + } +} diff --git a/crates/nano-arrow/src/compute/comparison/binary.rs b/crates/nano-arrow/src/compute/comparison/binary.rs new file mode 100644 index 000000000000..af87362a7841 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/binary.rs @@ -0,0 +1,238 @@ +//! Comparison functions for [`BinaryArray`] +use super::super::utils::combine_validities; +use crate::array::{BinaryArray, BooleanArray}; +use crate::bitmap::Bitmap; +use crate::compute::comparison::{finish_eq_validities, finish_neq_validities}; +use crate::datatypes::DataType; +use crate::offset::Offset; + +/// Evaluate `op(lhs, rhs)` for [`BinaryArray`]s using a specified +/// comparison function. +fn compare_op(lhs: &BinaryArray, rhs: &BinaryArray, op: F) -> BooleanArray +where + O: Offset, + F: Fn(&[u8], &[u8]) -> bool, +{ + assert_eq!(lhs.len(), rhs.len()); + + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = lhs + .values_iter() + .zip(rhs.values_iter()) + .map(|(lhs, rhs)| op(lhs, rhs)); + let values = Bitmap::from_trusted_len_iter(values); + + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Evaluate `op(lhs, rhs)` for [`BinaryArray`] and scalar using +/// a specified comparison function. 
+fn compare_op_scalar<O, F>(lhs: &BinaryArray<O>, rhs: &[u8], op: F) -> BooleanArray
+where
+    O: Offset,
+    F: Fn(&[u8], &[u8]) -> bool,
+{
+    let validity = lhs.validity().cloned();
+
+    let values = lhs.values_iter().map(|lhs| op(lhs, rhs));
+    let values = Bitmap::from_trusted_len_iter(values);
+
+    BooleanArray::new(DataType::Boolean, values, validity)
+}
+
+/// Perform `lhs == rhs` operation on [`BinaryArray`].
+/// # Panic
+/// iff the arrays do not have the same length.
+pub fn eq<O: Offset>(lhs: &BinaryArray<O>, rhs: &BinaryArray<O>) -> BooleanArray {
+    compare_op(lhs, rhs, |a, b| a == b)
+}
+
+/// Perform `lhs == rhs` operation on [`BinaryArray`] and include validities in comparison.
+/// # Panic
+/// iff the arrays do not have the same length.
+pub fn eq_and_validity<O: Offset>(lhs: &BinaryArray<O>, rhs: &BinaryArray<O>) -> BooleanArray {
+    let validity_lhs = lhs.validity().cloned();
+    let validity_rhs = rhs.validity().cloned();
+    let lhs = lhs.clone().with_validity(None);
+    let rhs = rhs.clone().with_validity(None);
+    let out = compare_op(&lhs, &rhs, |a, b| a == b);
+
+    finish_eq_validities(out, validity_lhs, validity_rhs)
+}
+
+/// Perform `lhs == rhs` operation on [`BinaryArray`] and a scalar.
+pub fn eq_scalar<O: Offset>(lhs: &BinaryArray<O>, rhs: &[u8]) -> BooleanArray {
+    compare_op_scalar(lhs, rhs, |a, b| a == b)
+}
+
+/// Perform `lhs == rhs` operation on [`BinaryArray`] and a scalar and include validities in comparison.
+pub fn eq_scalar_and_validity<O: Offset>(lhs: &BinaryArray<O>, rhs: &[u8]) -> BooleanArray {
+    let validity = lhs.validity().cloned();
+    let lhs = lhs.clone().with_validity(None);
+    let out = compare_op_scalar(&lhs, rhs, |a, b| a == b);
+
+    finish_eq_validities(out, validity, None)
+}
+
+/// Perform `lhs != rhs` operation on [`BinaryArray`].
+/// # Panic
+/// iff the arrays do not have the same length.
+pub fn neq<O: Offset>(lhs: &BinaryArray<O>, rhs: &BinaryArray<O>) -> BooleanArray {
+    compare_op(lhs, rhs, |a, b| a != b)
+}
+
+/// Perform `lhs != rhs` operation on [`BinaryArray`] and include validities in comparison.
+/// # Panic
+/// iff the arrays do not have the same length.
+pub fn neq_and_validity<O: Offset>(lhs: &BinaryArray<O>, rhs: &BinaryArray<O>) -> BooleanArray {
+    let validity_lhs = lhs.validity().cloned();
+    let validity_rhs = rhs.validity().cloned();
+    let lhs = lhs.clone().with_validity(None);
+    let rhs = rhs.clone().with_validity(None);
+
+    let out = compare_op(&lhs, &rhs, |a, b| a != b);
+    finish_neq_validities(out, validity_lhs, validity_rhs)
+}
+
+/// Perform `lhs != rhs` operation on [`BinaryArray`] and a scalar.
+pub fn neq_scalar<O: Offset>(lhs: &BinaryArray<O>, rhs: &[u8]) -> BooleanArray {
+    compare_op_scalar(lhs, rhs, |a, b| a != b)
+}
+
+/// Perform `lhs != rhs` operation on [`BinaryArray`] and a scalar and include validities in comparison.
+pub fn neq_scalar_and_validity<O: Offset>(lhs: &BinaryArray<O>, rhs: &[u8]) -> BooleanArray {
+    let validity = lhs.validity().cloned();
+    let lhs = lhs.clone().with_validity(None);
+    let out = compare_op_scalar(&lhs, rhs, |a, b| a != b);
+
+    finish_neq_validities(out, validity, None)
+}
+
+/// Perform `lhs < rhs` operation on [`BinaryArray`].
+pub fn lt<O: Offset>(lhs: &BinaryArray<O>, rhs: &BinaryArray<O>) -> BooleanArray {
+    compare_op(lhs, rhs, |a, b| a < b)
+}
+
+/// Perform `lhs < rhs` operation on [`BinaryArray`] and a scalar.
+pub fn lt_scalar<O: Offset>(lhs: &BinaryArray<O>, rhs: &[u8]) -> BooleanArray {
+    compare_op_scalar(lhs, rhs, |a, b| a < b)
+}
+
+/// Perform `lhs <= rhs` operation on [`BinaryArray`].
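// Hedged usage sketch of the scalar comparison defined above: each element is
// compared against a single `&[u8]` value and the input validity is kept.
fn binary_eq_scalar_example() {
    use crate::array::{BinaryArray, BooleanArray};
    let values = BinaryArray::<i32>::from([Some("foo".as_bytes()), None, Some("bar".as_bytes())]);
    let out = eq_scalar(&values, b"foo");
    assert_eq!(out, BooleanArray::from([Some(true), None, Some(false)]));
}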
+pub fn lt_eq(lhs: &BinaryArray, rhs: &BinaryArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a <= b) +} + +/// Perform `lhs <= rhs` operation on [`BinaryArray`] and a scalar. +pub fn lt_eq_scalar(lhs: &BinaryArray, rhs: &[u8]) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a <= b) +} + +/// Perform `lhs > rhs` operation on [`BinaryArray`]. +pub fn gt(lhs: &BinaryArray, rhs: &BinaryArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a > b) +} + +/// Perform `lhs > rhs` operation on [`BinaryArray`] and a scalar. +pub fn gt_scalar(lhs: &BinaryArray, rhs: &[u8]) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a > b) +} + +/// Perform `lhs >= rhs` operation on [`BinaryArray`]. +pub fn gt_eq(lhs: &BinaryArray, rhs: &BinaryArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a >= b) +} + +/// Perform `lhs >= rhs` operation on [`BinaryArray`] and a scalar. +pub fn gt_eq_scalar(lhs: &BinaryArray, rhs: &[u8]) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a >= b) +} + +#[cfg(test)] +mod tests { + use super::*; + + fn test_generic, &BinaryArray) -> BooleanArray>( + lhs: Vec<&[u8]>, + rhs: Vec<&[u8]>, + op: F, + expected: Vec, + ) { + let lhs = BinaryArray::::from_slice(lhs); + let rhs = BinaryArray::::from_slice(rhs); + let expected = BooleanArray::from_slice(expected); + assert_eq!(op(&lhs, &rhs), expected); + } + + fn test_generic_scalar, &[u8]) -> BooleanArray>( + lhs: Vec<&[u8]>, + rhs: &[u8], + op: F, + expected: Vec, + ) { + let lhs = BinaryArray::::from_slice(lhs); + let expected = BooleanArray::from_slice(expected); + assert_eq!(op(&lhs, rhs), expected); + } + + #[test] + fn test_gt_eq() { + test_generic::( + vec![b"arrow", b"datafusion", b"flight", b"parquet"], + vec![b"flight", b"flight", b"flight", b"flight"], + gt_eq, + vec![false, false, true, true], + ) + } + + #[test] + fn test_gt_eq_scalar() { + test_generic_scalar::( + vec![b"arrow", b"datafusion", b"flight", b"parquet"], + b"flight", + gt_eq_scalar, + vec![false, false, true, true], + ) + } + + #[test] + fn test_eq() { + test_generic::( + vec![b"arrow", b"arrow", b"arrow", b"arrow"], + vec![b"arrow", b"parquet", b"datafusion", b"flight"], + eq, + vec![true, false, false, false], + ) + } + + #[test] + fn test_eq_scalar() { + test_generic_scalar::( + vec![b"arrow", b"parquet", b"datafusion", b"flight"], + b"arrow", + eq_scalar, + vec![true, false, false, false], + ) + } + + #[test] + fn test_neq() { + test_generic::( + vec![b"arrow", b"arrow", b"arrow", b"arrow"], + vec![b"arrow", b"parquet", b"datafusion", b"flight"], + neq, + vec![false, true, true, true], + ) + } + + #[test] + fn test_neq_scalar() { + test_generic_scalar::( + vec![b"arrow", b"parquet", b"datafusion", b"flight"], + b"arrow", + neq_scalar, + vec![false, true, true, true], + ) + } +} diff --git a/crates/nano-arrow/src/compute/comparison/boolean.rs b/crates/nano-arrow/src/compute/comparison/boolean.rs new file mode 100644 index 000000000000..6b62f7fc6b00 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/boolean.rs @@ -0,0 +1,172 @@ +//! Comparison functions for [`BooleanArray`] +use super::super::utils::combine_validities; +use crate::array::BooleanArray; +use crate::bitmap::{binary, unary, Bitmap}; +use crate::compute::comparison::{finish_eq_validities, finish_neq_validities}; +use crate::datatypes::DataType; + +/// Evaluate `op(lhs, rhs)` for [`BooleanArray`]s using a specified +/// comparison function. 
+fn compare_op(lhs: &BooleanArray, rhs: &BooleanArray, op: F) -> BooleanArray +where + F: Fn(u64, u64) -> u64, +{ + assert_eq!(lhs.len(), rhs.len()); + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = binary(lhs.values(), rhs.values(), op); + + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Evaluate `op(left, right)` for [`BooleanArray`] and scalar using +/// a specified comparison function. +pub fn compare_op_scalar(lhs: &BooleanArray, rhs: bool, op: F) -> BooleanArray +where + F: Fn(u64, u64) -> u64, +{ + let rhs = if rhs { !0 } else { 0 }; + + let values = unary(lhs.values(), |x| op(x, rhs)); + BooleanArray::new(DataType::Boolean, values, lhs.validity().cloned()) +} + +/// Perform `lhs == rhs` operation on two [`BooleanArray`]s. +pub fn eq(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| !(a ^ b)) +} + +/// Perform `lhs == rhs` operation on two [`BooleanArray`]s and include validities in comparison. +pub fn eq_and_validity(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| !(a ^ b)); + + finish_eq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `lhs == rhs` operation on a [`BooleanArray`] and a scalar value. +pub fn eq_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + if rhs { + lhs.clone() + } else { + compare_op_scalar(lhs, rhs, |a, _| !a) + } +} + +/// Perform `lhs == rhs` operation on a [`BooleanArray`] and a scalar value and include validities in comparison. +pub fn eq_scalar_and_validity(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + if rhs { + finish_eq_validities(lhs, validity, None) + } else { + let lhs = lhs.with_validity(None); + + let out = compare_op_scalar(&lhs, rhs, |a, _| !a); + + finish_eq_validities(out, validity, None) + } +} + +/// `lhs != rhs` for [`BooleanArray`] +pub fn neq(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a ^ b) +} + +/// `lhs != rhs` for [`BooleanArray`] and include validities in comparison. +pub fn neq_and_validity(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| a ^ b); + + finish_neq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `left != right` operation on an array and a scalar value. +pub fn neq_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + eq_scalar(lhs, !rhs) +} + +/// Perform `left != right` operation on an array and a scalar value. +pub fn neq_scalar_and_validity(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let out = eq_scalar(&lhs, !rhs); + finish_neq_validities(out, validity, None) +} + +/// Perform `left < right` operation on two arrays. +pub fn lt(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| !a & b) +} + +/// Perform `left < right` operation on an array and a scalar value. 
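// The kernels above operate on whole 64-bit words of the packed bitmaps instead of
// individual booleans; per bit, `a == b` is `!(a ^ b)` and `a != b` is `a ^ b`.
// Plain-Rust sketch of that identity on a single word:
fn boolean_word_identity_example() {
    let a: u64 = 0b1010;
    let b: u64 = 0b1001;
    let eq_bits = !(a ^ b);
    // bits 2 and 3 agree, bits 0 and 1 differ
    assert_eq!(eq_bits & 0b1111, 0b1100);
}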
+pub fn lt_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + if rhs { + compare_op_scalar(lhs, rhs, |a, _| !a) + } else { + BooleanArray::new( + DataType::Boolean, + Bitmap::new_zeroed(lhs.len()), + lhs.validity().cloned(), + ) + } +} + +/// Perform `left <= right` operation on two arrays. +pub fn lt_eq(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| !a | b) +} + +/// Perform `left <= right` operation on an array and a scalar value. +/// Null values are less than non-null values. +pub fn lt_eq_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + if rhs { + let all_ones = !0; + compare_op_scalar(lhs, rhs, |_, _| all_ones) + } else { + compare_op_scalar(lhs, rhs, |a, _| !a) + } +} + +/// Perform `left > right` operation on two arrays. Non-null values are greater than null +/// values. +pub fn gt(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a & !b) +} + +/// Perform `left > right` operation on an array and a scalar value. +/// Non-null values are greater than null values. +pub fn gt_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + if rhs { + BooleanArray::new( + DataType::Boolean, + Bitmap::new_zeroed(lhs.len()), + lhs.validity().cloned(), + ) + } else { + lhs.clone() + } +} + +/// Perform `left >= right` operation on two arrays. Non-null values are greater than null +/// values. +pub fn gt_eq(lhs: &BooleanArray, rhs: &BooleanArray) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a | !b) +} + +/// Perform `left >= right` operation on an array and a scalar value. +/// Non-null values are greater than null values. +pub fn gt_eq_scalar(lhs: &BooleanArray, rhs: bool) -> BooleanArray { + if rhs { + lhs.clone() + } else { + let all_ones = !0; + compare_op_scalar(lhs, rhs, |_, _| all_ones) + } +} diff --git a/crates/nano-arrow/src/compute/comparison/mod.rs b/crates/nano-arrow/src/compute/comparison/mod.rs new file mode 100644 index 000000000000..96627ef2a5e1 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/mod.rs @@ -0,0 +1,613 @@ +//! Contains comparison operators +//! +//! The module contains functions that compare either an [`Array`] and a [`Scalar`] +//! or two [`Array`]s (of the same [`DataType`]). The scalar-oriented functions are +//! suffixed with `_scalar`. +//! +//! The functions are organized in two variants: +//! * statically typed +//! * dynamically typed +//! The statically typed are available under each module of this module (e.g. [`primitive::eq`], [`primitive::lt_scalar`]) +//! The dynamically typed are available in this module (e.g. [`eq`] or [`lt_scalar`]). +//! +//! # Examples +//! +//! Compare two [`PrimitiveArray`]s: +//! ``` +//! use arrow2::array::{BooleanArray, PrimitiveArray}; +//! use arrow2::compute::comparison::primitive::gt; +//! +//! let array1 = PrimitiveArray::::from([Some(1), None, Some(2)]); +//! let array2 = PrimitiveArray::::from([Some(1), Some(3), Some(1)]); +//! let result = gt(&array1, &array2); +//! assert_eq!(result, BooleanArray::from([Some(false), None, Some(true)])); +//! ``` +//! +//! Compare two dynamically-typed [`Array`]s (trait objects): +//! ``` +//! use arrow2::array::{Array, BooleanArray, PrimitiveArray}; +//! use arrow2::compute::comparison::eq; +//! +//! let array1: &dyn Array = &PrimitiveArray::::from(&[Some(10.0), None, Some(20.0)]); +//! let array2: &dyn Array = &PrimitiveArray::::from(&[Some(10.0), None, Some(10.0)]); +//! let result = eq(array1, array2); +//! 
assert_eq!(result, BooleanArray::from([Some(true), None, Some(false)])); +//! ``` +//! +//! Compare (not equal) a [`Utf8Array`] to a word: +//! ``` +//! use arrow2::array::{BooleanArray, Utf8Array}; +//! use arrow2::compute::comparison::utf8::neq_scalar; +//! +//! let array = Utf8Array::::from([Some("compute"), None, Some("compare")]); +//! let result = neq_scalar(&array, "compare"); +//! assert_eq!(result, BooleanArray::from([Some(true), None, Some(false)])); +//! ``` + +use crate::array::*; +use crate::datatypes::{DataType, IntervalUnit}; +use crate::scalar::*; + +pub mod binary; +pub mod boolean; +pub mod primitive; +pub mod utf8; + +mod simd; +pub use simd::{Simd8, Simd8Lanes, Simd8PartialEq, Simd8PartialOrd}; + +use super::take::take_boolean; +use crate::bitmap::{binary, Bitmap}; +use crate::compute; + +macro_rules! match_eq_ord {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + use crate::types::i256; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + Int256 => __with_ty__! { i256 }, + DaysMs => todo!(), + MonthDayNano => todo!(), + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + Float16 => todo!(), + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + } +})} + +macro_rules! match_eq {( + $key_type:expr, | $_:tt $T:ident | $($body:tt)* +) => ({ + macro_rules! __with_ty__ {( $_ $T:ident ) => ( $($body)* )} + use crate::datatypes::PrimitiveType::*; + use crate::types::{days_ms, months_days_ns, f16, i256}; + match $key_type { + Int8 => __with_ty__! { i8 }, + Int16 => __with_ty__! { i16 }, + Int32 => __with_ty__! { i32 }, + Int64 => __with_ty__! { i64 }, + Int128 => __with_ty__! { i128 }, + Int256 => __with_ty__! { i256 }, + DaysMs => __with_ty__! { days_ms }, + MonthDayNano => __with_ty__! { months_days_ns }, + UInt8 => __with_ty__! { u8 }, + UInt16 => __with_ty__! { u16 }, + UInt32 => __with_ty__! { u32 }, + UInt64 => __with_ty__! { u64 }, + Float16 => __with_ty__! { f16 }, + Float32 => __with_ty__! { f32 }, + Float64 => __with_ty__! { f64 }, + } +})} + +macro_rules! compare { + ($lhs:expr, $rhs:expr, $op:tt, $p:tt) => {{ + let lhs = $lhs; + let rhs = $rhs; + assert_eq!( + lhs.data_type().to_logical_type(), + rhs.data_type().to_logical_type() + ); + + use crate::datatypes::PhysicalType::*; + match lhs.data_type().to_physical_type() { + Boolean => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + boolean::$op(lhs, rhs) + }, + Primitive(primitive) => $p!(primitive, |$T| { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + primitive::$op::<$T>(lhs, rhs) + }), + LargeUtf8 => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + utf8::$op::(lhs, rhs) + }, + LargeBinary => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref().unwrap(); + binary::$op::(lhs, rhs) + }, + _ => todo!( + "Comparison between {:?} are not yet supported", + lhs.data_type() + ), + } + }}; +} + +/// `==` between two [`Array`]s. 
+/// Use [`can_eq`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn eq(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, eq, match_eq)
+}
+
+/// `==` between two [`Array`]s and includes validities in comparison.
+/// Use [`can_eq`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn eq_and_validity(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, eq_and_validity, match_eq)
+}
+
+/// Returns whether a [`DataType`] is supported by [`eq`].
+pub fn can_eq(data_type: &DataType) -> bool {
+    can_partial_eq(data_type)
+}
+
+/// `!=` between two [`Array`]s.
+/// Use [`can_neq`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn neq(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, neq, match_eq)
+}
+
+/// `!=` between two [`Array`]s and includes validities in comparison.
+/// Use [`can_neq`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn neq_and_validity(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, neq_and_validity, match_eq)
+}
+
+/// Returns whether a [`DataType`] is supported by [`neq`].
+pub fn can_neq(data_type: &DataType) -> bool {
+    can_partial_eq(data_type)
+}
+
+/// `<` between two [`Array`]s.
+/// Use [`can_lt`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn lt(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, lt, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`lt`].
+pub fn can_lt(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord(data_type)
+}
+
+/// `<=` between two [`Array`]s.
+/// Use [`can_lt_eq`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * the arrays do not have the same logical type
+/// * the arrays do not have the same length
+/// * the operation is not supported for the logical type
+pub fn lt_eq(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray {
+    compare!(lhs, rhs, lt_eq, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`lt_eq`].
+pub fn can_lt_eq(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord(data_type)
+}
+
+/// `>` between two [`Array`]s.
+/// Use [`can_gt`] to check whether the operation is valid +/// # Panic +/// Panics iff either: +/// * the arrays do not have have the same logical type +/// * the arrays do not have the same length +/// * the operation is not supported for the logical type +pub fn gt(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray { + compare!(lhs, rhs, gt, match_eq_ord) +} + +/// Returns whether a [`DataType`] is comparable is supported by [`gt`]. +pub fn can_gt(data_type: &DataType) -> bool { + can_partial_eq_and_ord(data_type) +} + +/// `>=` between two [`Array`]s. +/// Use [`can_gt_eq`] to check whether the operation is valid +/// # Panic +/// Panics iff either: +/// * the arrays do not have have the same logical type +/// * the arrays do not have the same length +/// * the operation is not supported for the logical type +pub fn gt_eq(lhs: &dyn Array, rhs: &dyn Array) -> BooleanArray { + compare!(lhs, rhs, gt_eq, match_eq_ord) +} + +/// Returns whether a [`DataType`] is comparable is supported by [`gt_eq`]. +pub fn can_gt_eq(data_type: &DataType) -> bool { + can_partial_eq_and_ord(data_type) +} + +macro_rules! compare_scalar { + ($lhs:expr, $rhs:expr, $op:tt, $p:tt) => {{ + let lhs = $lhs; + let rhs = $rhs; + assert_eq!( + lhs.data_type().to_logical_type(), + rhs.data_type().to_logical_type() + ); + if !rhs.is_valid() { + return BooleanArray::new_null(DataType::Boolean, lhs.len()); + } + + use crate::datatypes::PhysicalType::*; + match lhs.data_type().to_physical_type() { + Boolean => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref::().unwrap(); + // validity checked above + boolean::$op(lhs, rhs.value().unwrap()) + }, + Primitive(primitive) => $p!(primitive, |$T| { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref::>().unwrap(); + primitive::$op::<$T>(lhs, rhs.value().unwrap()) + }), + LargeUtf8 => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref::>().unwrap(); + utf8::$op::(lhs, rhs.value().unwrap()) + }, + LargeBinary => { + let lhs = lhs.as_any().downcast_ref().unwrap(); + let rhs = rhs.as_any().downcast_ref::>().unwrap(); + binary::$op::(lhs, rhs.value().unwrap()) + }, + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + let lhs = lhs.as_any().downcast_ref::>().unwrap(); + let values = $op(lhs.values().as_ref(), rhs); + + take_boolean(&values, lhs.keys()) + }) + }, + _ => todo!("Comparisons of {:?} are not yet supported", lhs.data_type()), + } + }}; +} + +/// `==` between an [`Array`] and a [`Scalar`]. +/// Use [`can_eq_scalar`] to check whether the operation is valid +/// # Panic +/// Panics iff either: +/// * they do not have have the same logical type +/// * the operation is not supported for the logical type +pub fn eq_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray { + compare_scalar!(lhs, rhs, eq_scalar, match_eq) +} + +/// `==` between an [`Array`] and a [`Scalar`] and includes validities in comparison. +/// Use [`can_eq_scalar`] to check whether the operation is valid +/// # Panic +/// Panics iff either: +/// * they do not have have the same logical type +/// * the operation is not supported for the logical type +pub fn eq_scalar_and_validity(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray { + compare_scalar!(lhs, rhs, eq_scalar_and_validity, match_eq) +} + +/// Returns whether a [`DataType`] is supported by [`eq_scalar`]. 
+pub fn can_eq_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_scalar(data_type)
+}
+
+/// `!=` between an [`Array`] and a [`Scalar`].
+/// Use [`can_neq_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn neq_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, neq_scalar, match_eq)
+}
+
+/// `!=` between an [`Array`] and a [`Scalar`] and includes validities in comparison.
+/// Use [`can_neq_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn neq_scalar_and_validity(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, neq_scalar_and_validity, match_eq)
+}
+
+/// Returns whether a [`DataType`] is supported by [`neq_scalar`].
+pub fn can_neq_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_scalar(data_type)
+}
+
+/// `<` between an [`Array`] and a [`Scalar`].
+/// Use [`can_lt_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn lt_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, lt_scalar, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`lt_scalar`].
+pub fn can_lt_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord_scalar(data_type)
+}
+
+/// `<=` between an [`Array`] and a [`Scalar`].
+/// Use [`can_lt_eq_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn lt_eq_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, lt_eq_scalar, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`lt_eq_scalar`].
+pub fn can_lt_eq_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord_scalar(data_type)
+}
+
+/// `>` between an [`Array`] and a [`Scalar`].
+/// Use [`can_gt_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn gt_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, gt_scalar, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`gt_scalar`].
+pub fn can_gt_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord_scalar(data_type)
+}
+
+/// `>=` between an [`Array`] and a [`Scalar`].
+/// Use [`can_gt_eq_scalar`] to check whether the operation is valid
+/// # Panic
+/// Panics iff either:
+/// * they do not have the same logical type
+/// * the operation is not supported for the logical type
+pub fn gt_eq_scalar(lhs: &dyn Array, rhs: &dyn Scalar) -> BooleanArray {
+    compare_scalar!(lhs, rhs, gt_eq_scalar, match_eq_ord)
+}
+
+/// Returns whether a [`DataType`] is supported by [`gt_eq_scalar`].
+pub fn can_gt_eq_scalar(data_type: &DataType) -> bool {
+    can_partial_eq_and_ord_scalar(data_type)
+}
+
+// The list of operations currently supported.
+fn can_partial_eq_and_ord_scalar(data_type: &DataType) -> bool { + if let DataType::Dictionary(_, values, _) = data_type.to_logical_type() { + return can_partial_eq_and_ord_scalar(values.as_ref()); + } + can_partial_eq_and_ord(data_type) +} + +// The list of operations currently supported. +fn can_partial_eq_and_ord(data_type: &DataType) -> bool { + matches!( + data_type, + DataType::Boolean + | DataType::Int8 + | DataType::Int16 + | DataType::Int32 + | DataType::Date32 + | DataType::Time32(_) + | DataType::Interval(IntervalUnit::YearMonth) + | DataType::Int64 + | DataType::Timestamp(_, _) + | DataType::Date64 + | DataType::Time64(_) + | DataType::Duration(_) + | DataType::UInt8 + | DataType::UInt16 + | DataType::UInt32 + | DataType::UInt64 + | DataType::Float32 + | DataType::Float64 + | DataType::Utf8 + | DataType::LargeUtf8 + | DataType::Decimal(_, _) + | DataType::Binary + | DataType::LargeBinary + ) +} + +// The list of operations currently supported. +fn can_partial_eq(data_type: &DataType) -> bool { + can_partial_eq_and_ord(data_type) + || matches!( + data_type.to_logical_type(), + DataType::Float16 + | DataType::Interval(IntervalUnit::DayTime) + | DataType::Interval(IntervalUnit::MonthDayNano) + ) +} + +// The list of operations currently supported. +fn can_partial_eq_scalar(data_type: &DataType) -> bool { + can_partial_eq_and_ord_scalar(data_type) + || matches!( + data_type.to_logical_type(), + DataType::Interval(IntervalUnit::DayTime) + | DataType::Interval(IntervalUnit::MonthDayNano) + ) +} + +/// Utility for low level end users that implement their own comparison functions +/// A comparison on the data column can be applied on masked out values +/// This function will correct equality for the validities. +pub fn finish_eq_validities( + output_without_validities: BooleanArray, + validity_lhs: Option, + validity_rhs: Option, +) -> BooleanArray { + match (validity_lhs, validity_rhs) { + (None, None) => output_without_validities, + (Some(lhs), None) => compute::boolean::and( + &BooleanArray::new(DataType::Boolean, lhs, None), + &output_without_validities, + ), + (None, Some(rhs)) => compute::boolean::and( + &output_without_validities, + &BooleanArray::new(DataType::Boolean, rhs, None), + ), + (Some(lhs), Some(rhs)) => { + let lhs_validity_unset_bits = lhs.unset_bits(); + let rhs_validity_unset_bits = rhs.unset_bits(); + + // this branch is a bit more complicated as both arrays can have masked out values + // these masked out values might differ and lead to a `eq == false` that has to + // be corrected as both should be `null == null = true` + + let lhs = BooleanArray::new(DataType::Boolean, lhs, None); + let rhs = BooleanArray::new(DataType::Boolean, rhs, None); + let eq_validities = compute::comparison::boolean::eq(&lhs, &rhs); + + // validity_bits are equal AND values are equal + let equal = compute::boolean::and(&output_without_validities, &eq_validities); + + match (lhs_validity_unset_bits, rhs_validity_unset_bits) { + // there is at least one side with all values valid + // so we don't have to correct. + (0, _) | (_, 0) => equal, + _ => { + // we use the binary kernel here to save allocations + // and apply `!(lhs | rhs)` in one step + let both_sides_invalid = + compute::boolean::binary_boolean_kernel(&lhs, &rhs, |lhs, rhs| { + binary(lhs, rhs, |lhs, rhs| !(lhs | rhs)) + }); + // this still might include incorrect masked out values + // under the validity bits, so we must correct for that + + // if not all true, e.g. at least one is set. 
+ // then we propagate that null as `true` in equality + if both_sides_invalid.values().unset_bits() != both_sides_invalid.len() { + compute::boolean::or(&equal, &both_sides_invalid) + } else { + equal + } + }, + } + }, + } +} + +/// Utility for low level end users that implement their own comparison functions +/// A comparison on the data column can be applied on masked out values +/// This function will correct non-equality for the validities. +pub fn finish_neq_validities( + output_without_validities: BooleanArray, + validity_lhs: Option, + validity_rhs: Option, +) -> BooleanArray { + match (validity_lhs, validity_rhs) { + (None, None) => output_without_validities, + (Some(lhs), None) => { + let lhs_negated = + compute::boolean::not(&BooleanArray::new(DataType::Boolean, lhs, None)); + compute::boolean::or(&lhs_negated, &output_without_validities) + }, + (None, Some(rhs)) => { + let rhs_negated = + compute::boolean::not(&BooleanArray::new(DataType::Boolean, rhs, None)); + compute::boolean::or(&output_without_validities, &rhs_negated) + }, + (Some(lhs), Some(rhs)) => { + let lhs_validity_unset_bits = lhs.unset_bits(); + let rhs_validity_unset_bits = rhs.unset_bits(); + + // this branch is a bit more complicated as both arrays can have masked out values + // these masked out values might differ and lead to a `neq == true` that has to + // be corrected as both should be `null != null = false` + let lhs = BooleanArray::new(DataType::Boolean, lhs, None); + let rhs = BooleanArray::new(DataType::Boolean, rhs, None); + let neq_validities = compute::comparison::boolean::neq(&lhs, &rhs); + + // validity_bits are not equal OR values not equal + let or = compute::boolean::or(&output_without_validities, &neq_validities); + + match (lhs_validity_unset_bits, rhs_validity_unset_bits) { + // there is at least one side with all values valid + // so we don't have to correct. + (0, _) | (_, 0) => or, + _ => { + // we use the binary kernel here to save allocations + // and apply `!(lhs | rhs)` in one step + let both_sides_invalid = + compute::boolean::binary_boolean_kernel(&lhs, &rhs, |lhs, rhs| { + binary(lhs, rhs, |lhs, rhs| !(lhs | rhs)) + }); + // this still might include incorrect masked out values + // under the validity bits, so we must correct for that + + // if not all true, e.g. at least one is set. + // then we propagate that null as `false` as the nulls are equal + if both_sides_invalid.values().unset_bits() != both_sides_invalid.len() { + // we use the `binary` kernel directly to save allocations + // and apply `lhs & !rhs)` in one shot. + + compute::boolean::binary_boolean_kernel( + &or, + &both_sides_invalid, + |lhs, rhs| binary(lhs, rhs, |lhs, rhs| (lhs & !rhs)), + ) + } else { + or + } + }, + } + }, + } +} diff --git a/crates/nano-arrow/src/compute/comparison/primitive.rs b/crates/nano-arrow/src/compute/comparison/primitive.rs new file mode 100644 index 000000000000..5ecda063cd22 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/primitive.rs @@ -0,0 +1,590 @@ +//! 
Comparison functions for [`PrimitiveArray`] +use super::super::utils::combine_validities; +use super::simd::{Simd8, Simd8Lanes, Simd8PartialEq, Simd8PartialOrd}; +use crate::array::{BooleanArray, PrimitiveArray}; +use crate::bitmap::MutableBitmap; +use crate::compute::comparison::{finish_eq_validities, finish_neq_validities}; +use crate::datatypes::DataType; +use crate::types::NativeType; + +pub(crate) fn compare_values_op(lhs: &[T], rhs: &[T], op: F) -> MutableBitmap +where + T: NativeType + Simd8, + F: Fn(T::Simd, T::Simd) -> u8, +{ + assert_eq!(lhs.len(), rhs.len()); + + let lhs_chunks_iter = lhs.chunks_exact(8); + let lhs_remainder = lhs_chunks_iter.remainder(); + let rhs_chunks_iter = rhs.chunks_exact(8); + let rhs_remainder = rhs_chunks_iter.remainder(); + + let mut values = Vec::with_capacity((lhs.len() + 7) / 8); + let iterator = lhs_chunks_iter.zip(rhs_chunks_iter).map(|(lhs, rhs)| { + let lhs = T::Simd::from_chunk(lhs); + let rhs = T::Simd::from_chunk(rhs); + op(lhs, rhs) + }); + values.extend(iterator); + + if !lhs_remainder.is_empty() { + let lhs = T::Simd::from_incomplete_chunk(lhs_remainder, T::default()); + let rhs = T::Simd::from_incomplete_chunk(rhs_remainder, T::default()); + values.push(op(lhs, rhs)) + }; + MutableBitmap::from_vec(values, lhs.len()) +} + +pub(crate) fn compare_values_op_scalar(lhs: &[T], rhs: T, op: F) -> MutableBitmap +where + T: NativeType + Simd8, + F: Fn(T::Simd, T::Simd) -> u8, +{ + let rhs = T::Simd::from_chunk(&[rhs; 8]); + + let lhs_chunks_iter = lhs.chunks_exact(8); + let lhs_remainder = lhs_chunks_iter.remainder(); + + let mut values = Vec::with_capacity((lhs.len() + 7) / 8); + let iterator = lhs_chunks_iter.map(|lhs| { + let lhs = T::Simd::from_chunk(lhs); + op(lhs, rhs) + }); + values.extend(iterator); + + if !lhs_remainder.is_empty() { + let lhs = T::Simd::from_incomplete_chunk(lhs_remainder, T::default()); + values.push(op(lhs, rhs)) + }; + + MutableBitmap::from_vec(values, lhs.len()) +} + +/// Evaluate `op(lhs, rhs)` for [`PrimitiveArray`]s using a specified +/// comparison function. +fn compare_op(lhs: &PrimitiveArray, rhs: &PrimitiveArray, op: F) -> BooleanArray +where + T: NativeType + Simd8, + F: Fn(T::Simd, T::Simd) -> u8, +{ + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = compare_values_op(lhs.values(), rhs.values(), op); + + BooleanArray::new(DataType::Boolean, values.into(), validity) +} + +/// Evaluate `op(left, right)` for [`PrimitiveArray`] and scalar using +/// a specified comparison function. +pub fn compare_op_scalar(lhs: &PrimitiveArray, rhs: T, op: F) -> BooleanArray +where + T: NativeType + Simd8, + F: Fn(T::Simd, T::Simd) -> u8, +{ + let validity = lhs.validity().cloned(); + + let values = compare_values_op_scalar(lhs.values(), rhs, op); + + BooleanArray::new(DataType::Boolean, values.into(), validity) +} + +/// Perform `lhs == rhs` operation on two arrays. +pub fn eq(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + compare_op(lhs, rhs, |a, b| a.eq(b)) +} + +/// Perform `lhs == rhs` operation on two arrays and include validities in comparison. 
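+///
+/// Unlike [`eq`], the returned array has no validity: positions where both inputs are
+/// null compare as `true`, and null versus non-null compares as `false`. A rough sketch
+/// (not compiled as a doctest here; paths follow the arrow2-style examples used elsewhere
+/// in this crate):
+///
+/// ```ignore
+/// use arrow2::array::Int32Array;
+///
+/// let lhs = Int32Array::from(&[Some(1), None, None]);
+/// let rhs = Int32Array::from(&[Some(1), Some(2), None]);
+/// // illustrative only: null == value -> false, null == null -> true
+/// let mask = eq_and_validity(&lhs, &rhs);
+/// assert_eq!(mask.values_iter().collect::<Vec<_>>(), vec![true, false, true]);
+/// ```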
+pub fn eq_and_validity(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| a.eq(b)); + + finish_eq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `left == right` operation on an array and a scalar value. +pub fn eq_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + compare_op_scalar(lhs, rhs, |a, b| a.eq(b)) +} + +/// Perform `left == right` operation on an array and a scalar value and include validities in comparison. +pub fn eq_scalar_and_validity(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let out = compare_op_scalar(&lhs, rhs, |a, b| a.eq(b)); + + finish_eq_validities(out, validity, None) +} + +/// Perform `left != right` operation on two arrays. +pub fn neq(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + compare_op(lhs, rhs, |a, b| a.neq(b)) +} + +/// Perform `left != right` operation on two arrays and include validities in comparison. +pub fn neq_and_validity(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| a.neq(b)); + + finish_neq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `left != right` operation on an array and a scalar value. +pub fn neq_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + compare_op_scalar(lhs, rhs, |a, b| a.neq(b)) +} + +/// Perform `left != right` operation on an array and a scalar value and include validities in comparison. +pub fn neq_scalar_and_validity(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialEq, +{ + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let out = compare_op_scalar(&lhs, rhs, |a, b| a.neq(b)); + + finish_neq_validities(out, validity, None) +} + +/// Perform `left < right` operation on two arrays. +pub fn lt(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op(lhs, rhs, |a, b| a.lt(b)) +} + +/// Perform `left < right` operation on an array and a scalar value. +pub fn lt_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op_scalar(lhs, rhs, |a, b| a.lt(b)) +} + +/// Perform `left <= right` operation on two arrays. +pub fn lt_eq(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op(lhs, rhs, |a, b| a.lt_eq(b)) +} + +/// Perform `left <= right` operation on an array and a scalar value. +/// Null values are less than non-null values. 
+pub fn lt_eq_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op_scalar(lhs, rhs, |a, b| a.lt_eq(b)) +} + +/// Perform `left > right` operation on two arrays. Non-null values are greater than null +/// values. +pub fn gt(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op(lhs, rhs, |a, b| a.gt(b)) +} + +/// Perform `left > right` operation on an array and a scalar value. +/// Non-null values are greater than null values. +pub fn gt_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op_scalar(lhs, rhs, |a, b| a.gt(b)) +} + +/// Perform `left >= right` operation on two arrays. Non-null values are greater than null +/// values. +pub fn gt_eq(lhs: &PrimitiveArray, rhs: &PrimitiveArray) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op(lhs, rhs, |a, b| a.gt_eq(b)) +} + +/// Perform `left >= right` operation on an array and a scalar value. +/// Non-null values are greater than null values. +pub fn gt_eq_scalar(lhs: &PrimitiveArray, rhs: T) -> BooleanArray +where + T: NativeType + Simd8, + T::Simd: Simd8PartialOrd, +{ + compare_op_scalar(lhs, rhs, |a, b| a.gt_eq(b)) +} + +// disable wrapping inside literal vectors used for test data and assertions +#[rustfmt::skip::macros(vec)] +#[cfg(test)] +mod tests { + use super::*; + use crate::array::{Int64Array, Int8Array}; + + /// Evaluate `KERNEL` with two vectors as inputs and assert against the expected output. + /// `A_VEC` and `B_VEC` can be of type `Vec` or `Vec>`. + /// `EXPECTED` can be either `Vec` or `Vec>`. + /// The main reason for this macro is that inputs and outputs align nicely after `cargo fmt`. + macro_rules! cmp_i64 { + ($KERNEL:ident, $A_VEC:expr, $B_VEC:expr, $EXPECTED:expr) => { + let a = Int64Array::from_slice($A_VEC); + let b = Int64Array::from_slice($B_VEC); + let c = $KERNEL(&a, &b); + assert_eq!(BooleanArray::from_slice($EXPECTED), c); + }; + } + + macro_rules! cmp_i64_options { + ($KERNEL:ident, $A_VEC:expr, $B_VEC:expr, $EXPECTED:expr) => { + let a = Int64Array::from($A_VEC); + let b = Int64Array::from($B_VEC); + let c = $KERNEL(&a, &b); + assert_eq!(BooleanArray::from($EXPECTED), c); + }; + } + + /// Evaluate `KERNEL` with one vectors and one scalar as inputs and assert against the expected output. + /// `A_VEC` can be of type `Vec` or `Vec>`. + /// `EXPECTED` can be either `Vec` or `Vec>`. + /// The main reason for this macro is that inputs and outputs align nicely after `cargo fmt`. + macro_rules! cmp_i64_scalar_options { + ($KERNEL:ident, $A_VEC:expr, $B:literal, $EXPECTED:expr) => { + let a = Int64Array::from($A_VEC); + let c = $KERNEL(&a, $B); + assert_eq!(BooleanArray::from($EXPECTED), c); + }; + } + + macro_rules! 
cmp_i64_scalar { + ($KERNEL:ident, $A_VEC:expr, $B:literal, $EXPECTED:expr) => { + let a = Int64Array::from_slice($A_VEC); + let c = $KERNEL(&a, $B); + assert_eq!(BooleanArray::from_slice($EXPECTED), c); + }; + } + + #[test] + fn test_primitive_array_eq() { + cmp_i64!( + eq, + &[8, 8, 8, 8, 8, 8, 8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![false, false, true, false, false, false, false, true, false, false] + ); + } + + #[test] + fn test_primitive_array_eq_scalar() { + cmp_i64_scalar!( + eq_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![false, false, true, false, false, false, false, true, false, false] + ); + } + + #[test] + fn test_primitive_array_eq_with_slice() { + let a = Int64Array::from_slice([6, 7, 8, 8, 10]); + let mut b = Int64Array::from_slice([1, 2, 3, 4, 5, 6, 7, 8, 9, 10]); + b.slice(5, 5); + let d = eq(&b, &a); + assert_eq!(d, BooleanArray::from_slice([true, true, true, false, true])); + } + + #[test] + fn test_primitive_array_neq() { + cmp_i64!( + neq, + &[8, 8, 8, 8, 8, 8, 8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![true, true, false, true, true, true, true, false, true, true] + ); + } + + #[test] + fn test_primitive_array_neq_scalar() { + cmp_i64_scalar!( + neq_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![true, true, false, true, true, true, true, false, true, true] + ); + } + + #[test] + fn test_primitive_array_lt() { + cmp_i64!( + lt, + &[8, 8, 8, 8, 8, 8, 8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![false, false, false, true, true, false, false, false, true, true] + ); + } + + #[test] + fn test_primitive_array_lt_scalar() { + cmp_i64_scalar!( + lt_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![true, true, false, false, false, true, true, false, false, false] + ); + } + + #[test] + fn test_primitive_array_lt_nulls() { + cmp_i64_options!( + lt, + &[None, None, Some(1), Some(1), None, None, Some(2), Some(2),], + &[None, Some(1), None, Some(1), None, Some(3), None, Some(3),], + vec![None, None, None, Some(false), None, None, None, Some(true)] + ); + } + + #[test] + fn test_primitive_array_lt_scalar_nulls() { + cmp_i64_scalar_options!( + lt_scalar, + &[None, Some(1), Some(2), Some(3), None, Some(1), Some(2), Some(3), Some(2), None], + 2, + vec![None, Some(true), Some(false), Some(false), None, Some(true), Some(false), Some(false), Some(false), None] + ); + } + + #[test] + fn test_primitive_array_lt_eq() { + cmp_i64!( + lt_eq, + &[8, 8, 8, 8, 8, 8, 8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![false, false, true, true, true, false, false, true, true, true] + ); + } + + #[test] + fn test_primitive_array_lt_eq_scalar() { + cmp_i64_scalar!( + lt_eq_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![true, true, true, false, false, true, true, true, false, false] + ); + } + + #[test] + fn test_primitive_array_lt_eq_nulls() { + cmp_i64_options!( + lt_eq, + &[ + None, + None, + Some(1), + None, + None, + Some(1), + None, + None, + Some(1) + ], + &[ + None, + Some(1), + Some(0), + None, + Some(1), + Some(2), + None, + None, + Some(3) + ], + vec![None, None, Some(false), None, None, Some(true), None, None, Some(true)] + ); + } + + #[test] + fn test_primitive_array_lt_eq_scalar_nulls() { + cmp_i64_scalar_options!( + lt_eq_scalar, + &[None, Some(1), Some(2), None, Some(1), Some(2), None, Some(1), Some(2)], + 1, + vec![None, Some(true), Some(false), None, Some(true), Some(false), None, Some(true), Some(false)] + ); + } + + #[test] + fn test_primitive_array_gt() { + cmp_i64!( + gt, + &[8, 8, 8, 8, 8, 8, 
8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![true, true, false, false, false, true, true, false, false, false] + ); + } + + #[test] + fn test_primitive_array_gt_scalar() { + cmp_i64_scalar!( + gt_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![false, false, false, true, true, false, false, false, true, true] + ); + } + + #[test] + fn test_primitive_array_gt_nulls() { + cmp_i64_options!( + gt, + &[ + None, + None, + Some(1), + None, + None, + Some(2), + None, + None, + Some(3) + ], + &[ + None, + Some(1), + Some(1), + None, + Some(1), + Some(1), + None, + Some(1), + Some(1) + ], + vec![None, None, Some(false), None, None, Some(true), None, None, Some(true)] + ); + } + + #[test] + fn test_primitive_array_gt_scalar_nulls() { + cmp_i64_scalar_options!( + gt_scalar, + &[None, Some(1), Some(2), None, Some(1), Some(2), None, Some(1), Some(2)], + 1, + vec![None, Some(false), Some(true), None, Some(false), Some(true), None, Some(false), Some(true)] + ); + } + + #[test] + fn test_primitive_array_gt_eq() { + cmp_i64!( + gt_eq, + &[8, 8, 8, 8, 8, 8, 8, 8, 8, 8], + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + vec![true, true, true, false, false, true, true, true, false, false] + ); + } + + #[test] + fn test_primitive_array_gt_eq_scalar() { + cmp_i64_scalar!( + gt_eq_scalar, + &[6, 7, 8, 9, 10, 6, 7, 8, 9, 10], + 8, + vec![false, false, true, true, true, false, false, true, true, true] + ); + } + + #[test] + fn test_primitive_array_gt_eq_nulls() { + cmp_i64_options!( + gt_eq, + vec![None, None, Some(1), None, Some(1), Some(2), None, None, Some(1)], + vec![None, Some(1), None, None, Some(1), Some(1), None, Some(2), Some(2)], + vec![None, None, None, None, Some(true), Some(true), None, None, Some(false)] + ); + } + + #[test] + fn test_primitive_array_gt_eq_scalar_nulls() { + cmp_i64_scalar_options!( + gt_eq_scalar, + vec![None, Some(1), Some(2), None, Some(2), Some(3), None, Some(3), Some(4)], + 2, + vec![None, Some(false), Some(true), None, Some(true), Some(true), None, Some(true), Some(true)] + ); + } + + #[test] + fn test_primitive_array_compare_slice() { + let mut a = (0..100).map(Some).collect::>(); + a.slice(50, 50); + let mut b = (100..200).map(Some).collect::>(); + b.slice(50, 50); + let actual = lt(&a, &b); + let expected: BooleanArray = (0..50).map(|_| Some(true)).collect(); + assert_eq!(expected, actual); + } + + #[test] + fn test_primitive_array_compare_scalar_slice() { + let mut a = (0..100).map(Some).collect::>(); + a.slice(50, 50); + let actual = lt_scalar(&a, 200); + let expected: BooleanArray = (0..50).map(|_| Some(true)).collect(); + assert_eq!(expected, actual); + } + + #[test] + fn test_length_of_result_buffer() { + // `item_count` is chosen to not be a multiple of 64. + const ITEM_COUNT: usize = 130; + + let array_a = Int8Array::from_slice([1; ITEM_COUNT]); + let array_b = Int8Array::from_slice([2; ITEM_COUNT]); + let expected = BooleanArray::from_slice([false; ITEM_COUNT]); + let result = gt_eq(&array_a, &array_b); + + assert_eq!(result, expected) + } +} diff --git a/crates/nano-arrow/src/compute/comparison/simd/mod.rs b/crates/nano-arrow/src/compute/comparison/simd/mod.rs new file mode 100644 index 000000000000..30d9773cd4c9 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/simd/mod.rs @@ -0,0 +1,133 @@ +use crate::types::NativeType; + +/// [`NativeType`] that supports a representation of 8 lanes +pub trait Simd8: NativeType { + /// The 8 lane representation of `Self` + type Simd: Simd8Lanes; +} + +/// Trait declaring an 8-lane multi-data. 
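+///
+/// The comparison helpers declared below return a `u8` bitmask in which bit `i` holds the
+/// result for lane `i`. A rough sketch of that convention (not compiled here; it assumes
+/// the scalar fallback where `Simd` is `[T; 8]`):
+///
+/// ```ignore
+/// let lhs = <i32 as Simd8>::Simd::from_chunk(&[0, 1, 2, 3, 4, 5, 6, 7]);
+/// let rhs = <i32 as Simd8>::Simd::from_chunk(&[7, 6, 5, 4, 3, 2, 1, 0]);
+/// // illustrative only: lanes 0..=3 satisfy `lhs < rhs`, so only the low four bits are set
+/// assert_eq!(lhs.lt(rhs), 0b0000_1111);
+/// ```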
+pub trait Simd8Lanes: Copy { + /// loads a complete chunk + fn from_chunk(v: &[T]) -> Self; + /// loads an incomplete chunk, filling the remaining items with `remaining`. + fn from_incomplete_chunk(v: &[T], remaining: T) -> Self; +} + +/// Trait implemented by implementors of [`Simd8Lanes`] whose [`Simd8`] implements [PartialEq]. +pub trait Simd8PartialEq: Copy { + /// Equal + fn eq(self, other: Self) -> u8; + /// Not equal + fn neq(self, other: Self) -> u8; +} + +/// Trait implemented by implementors of [`Simd8Lanes`] whose [`Simd8`] implements [PartialOrd]. +pub trait Simd8PartialOrd: Copy { + /// Less than or equal to + fn lt_eq(self, other: Self) -> u8; + /// Less than + fn lt(self, other: Self) -> u8; + /// Greater than + fn gt(self, other: Self) -> u8; + /// Greater than or equal to + fn gt_eq(self, other: Self) -> u8; +} + +#[inline] +pub(super) fn set bool>(lhs: [T; 8], rhs: [T; 8], op: F) -> u8 { + let mut byte = 0u8; + lhs.iter() + .zip(rhs.iter()) + .enumerate() + .for_each(|(i, (lhs, rhs))| { + byte |= if op(*lhs, *rhs) { 1 << i } else { 0 }; + }); + byte +} + +/// Types that implement Simd8 +macro_rules! simd8_native { + ($type:ty) => { + impl Simd8 for $type { + type Simd = [$type; 8]; + } + + impl Simd8Lanes<$type> for [$type; 8] { + #[inline] + fn from_chunk(v: &[$type]) -> Self { + v.try_into().unwrap() + } + + #[inline] + fn from_incomplete_chunk(v: &[$type], remaining: $type) -> Self { + let mut a = [remaining; 8]; + a.iter_mut().zip(v.iter()).for_each(|(a, b)| *a = *b); + a + } + } + }; +} + +/// Types that implement PartialEq +macro_rules! simd8_native_partial_eq { + ($type:ty) => { + impl Simd8PartialEq for [$type; 8] { + #[inline] + fn eq(self, other: Self) -> u8 { + set(self, other, |x, y| x == y) + } + + #[inline] + fn neq(self, other: Self) -> u8 { + #[allow(clippy::float_cmp)] + set(self, other, |x, y| x != y) + } + } + }; +} + +/// Types that implement PartialOrd +macro_rules! simd8_native_partial_ord { + ($type:ty) => { + impl Simd8PartialOrd for [$type; 8] { + #[inline] + fn lt_eq(self, other: Self) -> u8 { + set(self, other, |x, y| x <= y) + } + + #[inline] + fn lt(self, other: Self) -> u8 { + set(self, other, |x, y| x < y) + } + + #[inline] + fn gt_eq(self, other: Self) -> u8 { + set(self, other, |x, y| x >= y) + } + + #[inline] + fn gt(self, other: Self) -> u8 { + set(self, other, |x, y| x > y) + } + } + }; +} + +/// Types that implement simd8, PartialEq and PartialOrd +macro_rules! simd8_native_all { + ($type:ty) => { + simd8_native! {$type} + simd8_native_partial_eq! {$type} + simd8_native_partial_ord! 
{$type} + }; +} + +#[cfg(not(feature = "simd"))] +mod native; +#[cfg(not(feature = "simd"))] +pub use native::*; +#[cfg(feature = "simd")] +mod packed; +#[cfg(feature = "simd")] +pub use packed::*; diff --git a/crates/nano-arrow/src/compute/comparison/simd/native.rs b/crates/nano-arrow/src/compute/comparison/simd/native.rs new file mode 100644 index 000000000000..b8bbf9b17d66 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/simd/native.rs @@ -0,0 +1,23 @@ +use std::convert::TryInto; + +use super::{set, Simd8, Simd8Lanes, Simd8PartialEq, Simd8PartialOrd}; +use crate::types::{days_ms, f16, i256, months_days_ns}; + +simd8_native_all!(u8); +simd8_native_all!(u16); +simd8_native_all!(u32); +simd8_native_all!(u64); +simd8_native_all!(i8); +simd8_native_all!(i16); +simd8_native_all!(i32); +simd8_native_all!(i128); +simd8_native_all!(i256); +simd8_native_all!(i64); +simd8_native!(f16); +simd8_native_partial_eq!(f16); +simd8_native_all!(f32); +simd8_native_all!(f64); +simd8_native!(days_ms); +simd8_native_partial_eq!(days_ms); +simd8_native!(months_days_ns); +simd8_native_partial_eq!(months_days_ns); diff --git a/crates/nano-arrow/src/compute/comparison/simd/packed.rs b/crates/nano-arrow/src/compute/comparison/simd/packed.rs new file mode 100644 index 000000000000..707d875deef0 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/simd/packed.rs @@ -0,0 +1,81 @@ +use std::convert::TryInto; +use std::simd::{SimdPartialEq, SimdPartialOrd, ToBitMask}; + +use super::*; +use crate::types::simd::*; +use crate::types::{days_ms, f16, i256, months_days_ns}; + +macro_rules! simd8 { + ($type:ty, $md:ty) => { + impl Simd8 for $type { + type Simd = $md; + } + + impl Simd8Lanes<$type> for $md { + #[inline] + fn from_chunk(v: &[$type]) -> Self { + <$md>::from_slice(v) + } + + #[inline] + fn from_incomplete_chunk(v: &[$type], remaining: $type) -> Self { + let mut a = [remaining; 8]; + a.iter_mut().zip(v.iter()).for_each(|(a, b)| *a = *b); + Self::from_array(a) + } + } + + impl Simd8PartialEq for $md { + #[inline] + fn eq(self, other: Self) -> u8 { + self.simd_eq(other).to_bitmask() + } + + #[inline] + fn neq(self, other: Self) -> u8 { + self.simd_ne(other).to_bitmask() + } + } + + impl Simd8PartialOrd for $md { + #[inline] + fn lt_eq(self, other: Self) -> u8 { + self.simd_le(other).to_bitmask() + } + + #[inline] + fn lt(self, other: Self) -> u8 { + self.simd_lt(other).to_bitmask() + } + + #[inline] + fn gt_eq(self, other: Self) -> u8 { + self.simd_ge(other).to_bitmask() + } + + #[inline] + fn gt(self, other: Self) -> u8 { + self.simd_gt(other).to_bitmask() + } + } + }; +} + +simd8!(u8, u8x8); +simd8!(u16, u16x8); +simd8!(u32, u32x8); +simd8!(u64, u64x8); +simd8!(i8, i8x8); +simd8!(i16, i16x8); +simd8!(i32, i32x8); +simd8!(i64, i64x8); +simd8_native_all!(i128); +simd8_native_all!(i256); +simd8_native!(f16); +simd8_native_partial_eq!(f16); +simd8!(f32, f32x8); +simd8!(f64, f64x8); +simd8_native!(days_ms); +simd8_native_partial_eq!(days_ms); +simd8_native!(months_days_ns); +simd8_native_partial_eq!(months_days_ns); diff --git a/crates/nano-arrow/src/compute/comparison/utf8.rs b/crates/nano-arrow/src/compute/comparison/utf8.rs new file mode 100644 index 000000000000..cba683c7b869 --- /dev/null +++ b/crates/nano-arrow/src/compute/comparison/utf8.rs @@ -0,0 +1,291 @@ +//! 
Comparison functions for [`Utf8Array`] +use super::super::utils::combine_validities; +use crate::array::{BooleanArray, Utf8Array}; +use crate::bitmap::Bitmap; +use crate::compute::comparison::{finish_eq_validities, finish_neq_validities}; +use crate::datatypes::DataType; +use crate::offset::Offset; + +/// Evaluate `op(lhs, rhs)` for [`Utf8Array`]s using a specified +/// comparison function. +fn compare_op(lhs: &Utf8Array, rhs: &Utf8Array, op: F) -> BooleanArray +where + O: Offset, + F: Fn(&str, &str) -> bool, +{ + assert_eq!(lhs.len(), rhs.len()); + let validity = combine_validities(lhs.validity(), rhs.validity()); + + let values = lhs + .values_iter() + .zip(rhs.values_iter()) + .map(|(lhs, rhs)| op(lhs, rhs)); + let values = Bitmap::from_trusted_len_iter(values); + + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Evaluate `op(lhs, rhs)` for [`Utf8Array`] and scalar using +/// a specified comparison function. +fn compare_op_scalar(lhs: &Utf8Array, rhs: &str, op: F) -> BooleanArray +where + O: Offset, + F: Fn(&str, &str) -> bool, +{ + let validity = lhs.validity().cloned(); + + let values = lhs.values_iter().map(|lhs| op(lhs, rhs)); + let values = Bitmap::from_trusted_len_iter(values); + + BooleanArray::new(DataType::Boolean, values, validity) +} + +/// Perform `lhs == rhs` operation on [`Utf8Array`]. +pub fn eq(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a == b) +} + +/// Perform `lhs == rhs` operation on [`Utf8Array`] and include validities in comparison. +pub fn eq_and_validity(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| a == b); + + finish_eq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `lhs != rhs` operation on [`Utf8Array`] and include validities in comparison. +pub fn neq_and_validity(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + let validity_lhs = lhs.validity().cloned(); + let validity_rhs = rhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let rhs = rhs.clone().with_validity(None); + let out = compare_op(&lhs, &rhs, |a, b| a != b); + + finish_neq_validities(out, validity_lhs, validity_rhs) +} + +/// Perform `lhs == rhs` operation on [`Utf8Array`] and a scalar. +pub fn eq_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a == b) +} + +/// Perform `lhs == rhs` operation on [`Utf8Array`] and a scalar. Also includes null values in comparison. +pub fn eq_scalar_and_validity(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let out = compare_op_scalar(&lhs, rhs, |a, b| a == b); + + finish_eq_validities(out, validity, None) +} + +/// Perform `lhs != rhs` operation on [`Utf8Array`] and a scalar. Also includes null values in comparison. +pub fn neq_scalar_and_validity(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + let validity = lhs.validity().cloned(); + let lhs = lhs.clone().with_validity(None); + let out = compare_op_scalar(&lhs, rhs, |a, b| a != b); + + finish_neq_validities(out, validity, None) +} + +/// Perform `lhs != rhs` operation on [`Utf8Array`]. +pub fn neq(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a != b) +} + +/// Perform `lhs != rhs` operation on [`Utf8Array`] and a scalar. 
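+///
+/// A rough usage sketch (not compiled as a doctest here):
+///
+/// ```ignore
+/// use arrow2::array::Utf8Array;
+///
+/// let array = Utf8Array::<i32>::from_slice(["arrow", "nano"]);
+/// // illustrative only: element-wise `!=` against a single &str
+/// let mask = neq_scalar(&array, "arrow");
+/// assert_eq!(mask.values_iter().collect::<Vec<_>>(), vec![false, true]);
+/// ```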
+pub fn neq_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a != b) +} + +/// Perform `lhs < rhs` operation on [`Utf8Array`]. +pub fn lt(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a < b) +} + +/// Perform `lhs < rhs` operation on [`Utf8Array`] and a scalar. +pub fn lt_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a < b) +} + +/// Perform `lhs <= rhs` operation on [`Utf8Array`]. +pub fn lt_eq(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a <= b) +} + +/// Perform `lhs <= rhs` operation on [`Utf8Array`] and a scalar. +pub fn lt_eq_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a <= b) +} + +/// Perform `lhs > rhs` operation on [`Utf8Array`]. +pub fn gt(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a > b) +} + +/// Perform `lhs > rhs` operation on [`Utf8Array`] and a scalar. +pub fn gt_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a > b) +} + +/// Perform `lhs >= rhs` operation on [`Utf8Array`]. +pub fn gt_eq(lhs: &Utf8Array, rhs: &Utf8Array) -> BooleanArray { + compare_op(lhs, rhs, |a, b| a >= b) +} + +/// Perform `lhs >= rhs` operation on [`Utf8Array`] and a scalar. +pub fn gt_eq_scalar(lhs: &Utf8Array, rhs: &str) -> BooleanArray { + compare_op_scalar(lhs, rhs, |a, b| a >= b) +} + +#[cfg(test)] +mod tests { + use super::*; + + fn test_generic, &Utf8Array) -> BooleanArray>( + lhs: Vec<&str>, + rhs: Vec<&str>, + op: F, + expected: Vec, + ) { + let lhs = Utf8Array::::from_slice(lhs); + let rhs = Utf8Array::::from_slice(rhs); + let expected = BooleanArray::from_slice(expected); + assert_eq!(op(&lhs, &rhs), expected); + } + + fn test_generic_scalar, &str) -> BooleanArray>( + lhs: Vec<&str>, + rhs: &str, + op: F, + expected: Vec, + ) { + let lhs = Utf8Array::::from_slice(lhs); + let expected = BooleanArray::from_slice(expected); + assert_eq!(op(&lhs, rhs), expected); + } + + #[test] + fn test_gt_eq() { + test_generic::( + vec!["arrow", "datafusion", "flight", "parquet"], + vec!["flight", "flight", "flight", "flight"], + gt_eq, + vec![false, false, true, true], + ) + } + + #[test] + fn test_gt_eq_scalar() { + test_generic_scalar::( + vec!["arrow", "datafusion", "flight", "parquet"], + "flight", + gt_eq_scalar, + vec![false, false, true, true], + ) + } + + #[test] + fn test_eq() { + test_generic::( + vec!["arrow", "arrow", "arrow", "arrow"], + vec!["arrow", "parquet", "datafusion", "flight"], + eq, + vec![true, false, false, false], + ) + } + + #[test] + fn test_eq_scalar() { + test_generic_scalar::( + vec!["arrow", "parquet", "datafusion", "flight"], + "arrow", + eq_scalar, + vec![true, false, false, false], + ) + } + + #[test] + fn test_neq() { + test_generic::( + vec!["arrow", "arrow", "arrow", "arrow"], + vec!["arrow", "parquet", "datafusion", "flight"], + neq, + vec![false, true, true, true], + ) + } + + #[test] + fn test_neq_scalar() { + test_generic_scalar::( + vec!["arrow", "parquet", "datafusion", "flight"], + "arrow", + neq_scalar, + vec![false, true, true, true], + ) + } + + /* + test_utf8!( + test_utf8_array_lt, + vec!["arrow", "datafusion", "flight", "parquet"], + vec!["flight", "flight", "flight", "flight"], + lt_utf8, + vec![true, true, false, false] + ); + test_utf8_scalar!( + test_utf8_array_lt_scalar, + vec!["arrow", "datafusion", "flight", "parquet"], + "flight", + lt_utf8_scalar, + vec![true, true, 
false, false] + ); + + test_utf8!( + test_utf8_array_lt_eq, + vec!["arrow", "datafusion", "flight", "parquet"], + vec!["flight", "flight", "flight", "flight"], + lt_eq_utf8, + vec![true, true, true, false] + ); + test_utf8_scalar!( + test_utf8_array_lt_eq_scalar, + vec!["arrow", "datafusion", "flight", "parquet"], + "flight", + lt_eq_utf8_scalar, + vec![true, true, true, false] + ); + + test_utf8!( + test_utf8_array_gt, + vec!["arrow", "datafusion", "flight", "parquet"], + vec!["flight", "flight", "flight", "flight"], + gt_utf8, + vec![false, false, false, true] + ); + test_utf8_scalar!( + test_utf8_array_gt_scalar, + vec!["arrow", "datafusion", "flight", "parquet"], + "flight", + gt_utf8_scalar, + vec![false, false, false, true] + ); + + test_utf8!( + test_utf8_array_gt_eq, + vec!["arrow", "datafusion", "flight", "parquet"], + vec!["flight", "flight", "flight", "flight"], + gt_eq_utf8, + vec![false, false, true, true] + ); + test_utf8_scalar!( + test_utf8_array_gt_eq_scalar, + vec!["arrow", "datafusion", "flight", "parquet"], + "flight", + gt_eq_utf8_scalar, + vec![false, false, true, true] + ); + */ +} diff --git a/crates/nano-arrow/src/compute/concatenate.rs b/crates/nano-arrow/src/compute/concatenate.rs new file mode 100644 index 000000000000..5e38731a2fe9 --- /dev/null +++ b/crates/nano-arrow/src/compute/concatenate.rs @@ -0,0 +1,47 @@ +//! Contains the concatenate kernel +//! +//! Example: +//! +//! ``` +//! use arrow2::array::Utf8Array; +//! use arrow2::compute::concatenate::concatenate; +//! +//! let arr = concatenate(&[ +//! &Utf8Array::::from_slice(["hello", "world"]), +//! &Utf8Array::::from_slice(["!"]), +//! ]).unwrap(); +//! assert_eq!(arr.len(), 3); +//! ``` + +use crate::array::growable::make_growable; +use crate::array::Array; +use crate::error::{Error, Result}; + +/// Concatenate multiple [Array] of the same type into a single [`Array`]. +pub fn concatenate(arrays: &[&dyn Array]) -> Result> { + if arrays.is_empty() { + return Err(Error::InvalidArgumentError( + "concat requires input of at least one array".to_string(), + )); + } + + if arrays + .iter() + .any(|array| array.data_type() != arrays[0].data_type()) + { + return Err(Error::InvalidArgumentError( + "It is not possible to concatenate arrays of different data types.".to_string(), + )); + } + + let lengths = arrays.iter().map(|array| array.len()).collect::>(); + let capacity = lengths.iter().sum(); + + let mut mutable = make_growable(arrays, false, capacity); + + for (i, len) in lengths.iter().enumerate() { + mutable.extend(i, 0, *len) + } + + Ok(mutable.as_box()) +} diff --git a/crates/nano-arrow/src/compute/filter.rs b/crates/nano-arrow/src/compute/filter.rs new file mode 100644 index 000000000000..90ddf4b4d158 --- /dev/null +++ b/crates/nano-arrow/src/compute/filter.rs @@ -0,0 +1,321 @@ +//! Contains operators to filter arrays such as [`filter`]. 
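+//!
+//! A rough sketch of reusing one mask across several columns via [`build_filter`]
+//! (not compiled as a doctest here; paths follow the `arrow2`-style examples used
+//! elsewhere in this crate):
+//!
+//! ```ignore
+//! use arrow2::array::{BooleanArray, Int32Array, Utf8Array};
+//! use arrow2::compute::filter::build_filter;
+//!
+//! let mask = BooleanArray::from_slice([true, false, true]);
+//! let ints = Int32Array::from_slice([1, 2, 3]);
+//! let names = Utf8Array::<i64>::from_slice(["a", "b", "c"]);
+//!
+//! // illustrative only: the mask is analysed once...
+//! let filter = build_filter(&mask).unwrap();
+//! // ...and the prepared closure is applied to each column
+//! let filtered_ints = filter(&ints);
+//! let filtered_names = filter(&names);
+//! ```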
+use crate::array::growable::{make_growable, Growable}; +use crate::array::*; +use crate::bitmap::utils::{BitChunkIterExact, BitChunksExact, SlicesIterator}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::chunk::Chunk; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::simd::Simd; +use crate::types::{BitChunkOnes, NativeType}; + +/// Function that can filter arbitrary arrays +pub type Filter<'a> = Box Box + 'a + Send + Sync>; + +#[inline] +fn get_leading_ones(chunk: u64) -> u32 { + if cfg!(target_endian = "little") { + chunk.trailing_ones() + } else { + chunk.leading_ones() + } +} + +/// # Safety +/// This assumes that the `mask_chunks` contains a number of set/true items equal +/// to `filter_count` +unsafe fn nonnull_filter_impl(values: &[T], mut mask_chunks: I, filter_count: usize) -> Vec +where + T: NativeType + Simd, + I: BitChunkIterExact, +{ + let mut chunks = values.chunks_exact(64); + let mut new = Vec::::with_capacity(filter_count); + let mut dst = new.as_mut_ptr(); + + chunks + .by_ref() + .zip(mask_chunks.by_ref()) + .for_each(|(chunk, mask_chunk)| { + let ones = mask_chunk.count_ones(); + let leading_ones = get_leading_ones(mask_chunk); + + if ones == leading_ones { + let size = leading_ones as usize; + unsafe { + std::ptr::copy(chunk.as_ptr(), dst, size); + dst = dst.add(size); + } + return; + } + + let ones_iter = BitChunkOnes::from_known_count(mask_chunk, ones as usize); + for pos in ones_iter { + dst.write(*chunk.get_unchecked(pos)); + dst = dst.add(1); + } + }); + + chunks + .remainder() + .iter() + .zip(mask_chunks.remainder_iter()) + .for_each(|(value, b)| { + if b { + unsafe { + dst.write(*value); + dst = dst.add(1); + }; + } + }); + + unsafe { new.set_len(filter_count) }; + new +} + +/// # Safety +/// This assumes that the `mask_chunks` contains a number of set/true items equal +/// to `filter_count` +unsafe fn null_filter_impl( + values: &[T], + validity: &Bitmap, + mut mask_chunks: I, + filter_count: usize, +) -> (Vec, MutableBitmap) +where + T: NativeType + Simd, + I: BitChunkIterExact, +{ + let mut chunks = values.chunks_exact(64); + + let mut validity_chunks = validity.chunks::(); + + let mut new = Vec::::with_capacity(filter_count); + let mut dst = new.as_mut_ptr(); + let mut new_validity = MutableBitmap::with_capacity(filter_count); + + chunks + .by_ref() + .zip(validity_chunks.by_ref()) + .zip(mask_chunks.by_ref()) + .for_each(|((chunk, validity_chunk), mask_chunk)| { + let ones = mask_chunk.count_ones(); + let leading_ones = get_leading_ones(mask_chunk); + + if ones == leading_ones { + let size = leading_ones as usize; + unsafe { + std::ptr::copy(chunk.as_ptr(), dst, size); + dst = dst.add(size); + + // safety: invariant offset + length <= slice.len() + new_validity.extend_from_slice_unchecked( + validity_chunk.to_ne_bytes().as_ref(), + 0, + size, + ); + } + return; + } + + // this triggers a bitcount + let ones_iter = BitChunkOnes::from_known_count(mask_chunk, ones as usize); + for pos in ones_iter { + dst.write(*chunk.get_unchecked(pos)); + dst = dst.add(1); + new_validity.push_unchecked(validity_chunk & (1 << pos) > 0); + } + }); + + chunks + .remainder() + .iter() + .zip(validity_chunks.remainder_iter()) + .zip(mask_chunks.remainder_iter()) + .for_each(|((value, is_valid), is_selected)| { + if is_selected { + unsafe { + dst.write(*value); + dst = dst.add(1); + new_validity.push_unchecked(is_valid); + }; + } + }); + + unsafe { new.set_len(filter_count) }; + (new, new_validity) +} + +fn null_filter_simd( + values: &[T], 
+ validity: &Bitmap, + mask: &Bitmap, +) -> (Vec, MutableBitmap) { + assert_eq!(values.len(), mask.len()); + let filter_count = mask.len() - mask.unset_bits(); + + let (slice, offset, length) = mask.as_slice(); + if offset == 0 { + let mask_chunks = BitChunksExact::::new(slice, length); + unsafe { null_filter_impl(values, validity, mask_chunks, filter_count) } + } else { + let mask_chunks = mask.chunks::(); + unsafe { null_filter_impl(values, validity, mask_chunks, filter_count) } + } +} + +fn nonnull_filter_simd(values: &[T], mask: &Bitmap) -> Vec { + assert_eq!(values.len(), mask.len()); + let filter_count = mask.len() - mask.unset_bits(); + + let (slice, offset, length) = mask.as_slice(); + if offset == 0 { + let mask_chunks = BitChunksExact::::new(slice, length); + unsafe { nonnull_filter_impl(values, mask_chunks, filter_count) } + } else { + let mask_chunks = mask.chunks::(); + unsafe { nonnull_filter_impl(values, mask_chunks, filter_count) } + } +} + +fn filter_nonnull_primitive( + array: &PrimitiveArray, + mask: &Bitmap, +) -> PrimitiveArray { + assert_eq!(array.len(), mask.len()); + + if let Some(validity) = array.validity() { + let (values, validity) = null_filter_simd(array.values(), validity, mask); + PrimitiveArray::::new(array.data_type().clone(), values.into(), validity.into()) + } else { + let values = nonnull_filter_simd(array.values(), mask); + PrimitiveArray::::new(array.data_type().clone(), values.into(), None) + } +} + +fn filter_primitive( + array: &PrimitiveArray, + mask: &BooleanArray, +) -> PrimitiveArray { + // todo: branch on mask.validity() + filter_nonnull_primitive(array, mask.values()) +} + +fn filter_growable<'a>(growable: &mut impl Growable<'a>, chunks: &[(usize, usize)]) { + chunks + .iter() + .for_each(|(start, len)| growable.extend(0, *start, *len)); +} + +/// Returns a prepared function optimized to filter multiple arrays. +/// Creating this function requires time, but using it is faster than [filter] when the +/// same filter needs to be applied to multiple arrays (e.g. a multiple columns). +pub fn build_filter(filter: &BooleanArray) -> Result { + let iter = SlicesIterator::new(filter.values()); + let filter_count = iter.slots(); + let chunks = iter.collect::>(); + + use crate::datatypes::PhysicalType::*; + Ok(Box::new(move |array: &dyn Array| { + match array.data_type().to_physical_type() { + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let array = array.as_any().downcast_ref().unwrap(); + let mut growable = + growable::GrowablePrimitive::<$T>::new(vec![array], false, filter_count); + filter_growable(&mut growable, &chunks); + let array: PrimitiveArray<$T> = growable.into(); + Box::new(array) + }), + LargeUtf8 => { + let array = array.as_any().downcast_ref::>().unwrap(); + let mut growable = growable::GrowableUtf8::new(vec![array], false, filter_count); + filter_growable(&mut growable, &chunks); + let array: Utf8Array = growable.into(); + Box::new(array) + }, + _ => { + let mut mutable = make_growable(&[array], false, filter_count); + chunks + .iter() + .for_each(|(start, len)| mutable.extend(0, *start, *len)); + mutable.as_box() + }, + } + })) +} + +/// Filters an [Array], returning elements matching the filter (i.e. where the values are true). +/// +/// Note that the nulls of `filter` are interpreted as `false` will lead to these elements being +/// masked out. 
+/// +/// # Example +/// ```rust +/// # use arrow2::array::{Int32Array, PrimitiveArray, BooleanArray}; +/// # use arrow2::error::Result; +/// # use arrow2::compute::filter::filter; +/// # fn main() -> Result<()> { +/// let array = PrimitiveArray::from_slice([5, 6, 7, 8, 9]); +/// let filter_array = BooleanArray::from_slice(&vec![true, false, false, true, false]); +/// let c = filter(&array, &filter_array)?; +/// let c = c.as_any().downcast_ref::().unwrap(); +/// assert_eq!(c, &PrimitiveArray::from_slice(vec![5, 8])); +/// # Ok(()) +/// # } +/// ``` +pub fn filter(array: &dyn Array, filter: &BooleanArray) -> Result> { + // The validities may be masking out `true` bits, making the filter operation + // based on the values incorrect + if let Some(validities) = filter.validity() { + let values = filter.values(); + let new_values = values & validities; + let filter = BooleanArray::new(DataType::Boolean, new_values, None); + return crate::compute::filter::filter(array, &filter); + } + + let false_count = filter.values().unset_bits(); + if false_count == filter.len() { + assert_eq!(array.len(), filter.len()); + return Ok(new_empty_array(array.data_type().clone())); + } + if false_count == 0 { + assert_eq!(array.len(), filter.len()); + return Ok(array.to_boxed()); + } + + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let array = array.as_any().downcast_ref().unwrap(); + Ok(Box::new(filter_primitive::<$T>(array, filter))) + }), + _ => { + let iter = SlicesIterator::new(filter.values()); + let mut mutable = make_growable(&[array], false, iter.slots()); + iter.for_each(|(start, len)| mutable.extend(0, start, len)); + Ok(mutable.as_box()) + }, + } +} + +/// Returns a new [Chunk] with arrays containing only values matching the filter. +/// This is a convenience function: filter multiple columns is embarrassingly parallel. +pub fn filter_chunk>( + columns: &Chunk, + filter_values: &BooleanArray, +) -> Result>> { + let arrays = columns.arrays(); + + let num_columns = arrays.len(); + + let filtered_arrays = match num_columns { + 1 => { + vec![filter(columns.arrays()[0].as_ref(), filter_values)?] + }, + _ => { + let filter = build_filter(filter_values)?; + arrays.iter().map(|a| filter(a.as_ref())).collect() + }, + }; + Chunk::try_new(filtered_arrays) +} diff --git a/crates/nano-arrow/src/compute/if_then_else.rs b/crates/nano-arrow/src/compute/if_then_else.rs new file mode 100644 index 000000000000..86c46b29d040 --- /dev/null +++ b/crates/nano-arrow/src/compute/if_then_else.rs @@ -0,0 +1,75 @@ +//! Contains the operator [`if_then_else`]. +use crate::array::{growable, Array, BooleanArray}; +use crate::bitmap::utils::SlicesIterator; +use crate::error::{Error, Result}; + +/// Returns the values from `lhs` if the predicate is `true` or from the `rhs` if the predicate is false +/// Returns `None` if the predicate is `None`. 
+/// # Example +/// ```rust +/// # use arrow2::error::Result; +/// use arrow2::compute::if_then_else::if_then_else; +/// use arrow2::array::{Int32Array, BooleanArray}; +/// +/// # fn main() -> Result<()> { +/// let lhs = Int32Array::from_slice(&[1, 2, 3]); +/// let rhs = Int32Array::from_slice(&[4, 5, 6]); +/// let predicate = BooleanArray::from(&[Some(true), None, Some(false)]); +/// let result = if_then_else(&predicate, &lhs, &rhs)?; +/// +/// let expected = Int32Array::from(&[Some(1), None, Some(6)]); +/// +/// assert_eq!(expected, result.as_ref()); +/// # Ok(()) +/// # } +/// ``` +pub fn if_then_else( + predicate: &BooleanArray, + lhs: &dyn Array, + rhs: &dyn Array, +) -> Result> { + if lhs.data_type() != rhs.data_type() { + return Err(Error::InvalidArgumentError(format!( + "If then else requires the arguments to have the same datatypes ({:?} != {:?})", + lhs.data_type(), + rhs.data_type() + ))); + } + if (lhs.len() != rhs.len()) | (lhs.len() != predicate.len()) { + return Err(Error::InvalidArgumentError(format!( + "If then else requires all arguments to have the same length (predicate = {}, lhs = {}, rhs = {})", + predicate.len(), + lhs.len(), + rhs.len() + ))); + } + + let result = if predicate.null_count() > 0 { + let mut growable = growable::make_growable(&[lhs, rhs], true, lhs.len()); + for (i, v) in predicate.iter().enumerate() { + match v { + Some(v) => growable.extend(!v as usize, i, 1), + None => growable.extend_validity(1), + } + } + growable.as_box() + } else { + let mut growable = growable::make_growable(&[lhs, rhs], false, lhs.len()); + let mut start_falsy = 0; + let mut total_len = 0; + for (start, len) in SlicesIterator::new(predicate.values()) { + if start != start_falsy { + growable.extend(1, start_falsy, start - start_falsy); + total_len += start - start_falsy; + }; + growable.extend(0, start, len); + total_len += len; + start_falsy = start + len; + } + if total_len != lhs.len() { + growable.extend(1, total_len, lhs.len() - total_len); + } + growable.as_box() + }; + Ok(result) +} diff --git a/crates/nano-arrow/src/compute/mod.rs b/crates/nano-arrow/src/compute/mod.rs new file mode 100644 index 000000000000..a40e4dcbb558 --- /dev/null +++ b/crates/nano-arrow/src/compute/mod.rs @@ -0,0 +1,52 @@ +//! contains a wide range of compute operations (e.g. +//! [`arithmetics`], [`aggregate`], +//! [`filter`], [`comparison`], and [`sort`]) +//! +//! This module's general design is +//! that each operator has two interfaces, a statically-typed version and a dynamically-typed +//! version. +//! The statically-typed version expects concrete arrays (such as [`PrimitiveArray`](crate::array::PrimitiveArray)); +//! the dynamically-typed version expects `&dyn Array` and errors if the the type is not +//! supported. +//! Some dynamically-typed operators have an auxiliary function, `can_*`, that returns +//! true if the operator can be applied to the particular `DataType`. 
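+//!
+//! A rough sketch of the dynamically-typed flow (not compiled as a doctest here; it
+//! assumes the `compute_comparison` feature and the `arrow2`-style paths used by the
+//! other doc examples in this crate):
+//!
+//! ```ignore
+//! use arrow2::array::Int32Array;
+//! use arrow2::compute::comparison::{can_eq, eq};
+//!
+//! let lhs = Int32Array::from_slice([1, 2, 3]);
+//! let rhs = Int32Array::from_slice([1, 5, 3]);
+//! // illustrative only: check the `DataType` first, then call the `&dyn Array` kernel
+//! assert!(can_eq(lhs.data_type()));
+//! let mask = eq(&lhs, &rhs);
+//! assert_eq!(mask.values_iter().collect::<Vec<_>>(), vec![true, false, true]);
+//! ```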
+ +#[cfg(any(feature = "compute_aggregate", feature = "io_parquet"))] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_aggregate")))] +pub mod aggregate; +#[cfg(feature = "compute_arithmetics")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_arithmetics")))] +pub mod arithmetics; +pub mod arity; +pub mod arity_assign; +#[cfg(feature = "compute_bitwise")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_bitwise")))] +pub mod bitwise; +#[cfg(feature = "compute_boolean")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_boolean")))] +pub mod boolean; +#[cfg(feature = "compute_boolean_kleene")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_boolean_kleene")))] +pub mod boolean_kleene; +#[cfg(feature = "compute_cast")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_cast")))] +pub mod cast; +#[cfg(feature = "compute_comparison")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_comparison")))] +pub mod comparison; +#[cfg(feature = "compute_concatenate")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_concatenate")))] +pub mod concatenate; +#[cfg(feature = "compute_filter")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_filter")))] +pub mod filter; +#[cfg(feature = "compute_if_then_else")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_if_then_else")))] +pub mod if_then_else; +#[cfg(feature = "compute_take")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_take")))] +pub mod take; +#[cfg(feature = "compute_temporal")] +#[cfg_attr(docsrs, doc(cfg(feature = "compute_temporal")))] +pub mod temporal; +mod utils; diff --git a/crates/nano-arrow/src/compute/take/binary.rs b/crates/nano-arrow/src/compute/take/binary.rs new file mode 100644 index 000000000000..0e6460206f0e --- /dev/null +++ b/crates/nano-arrow/src/compute/take/binary.rs @@ -0,0 +1,41 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. 
+ +use super::generic_binary::*; +use super::Index; +use crate::array::{Array, BinaryArray, PrimitiveArray}; +use crate::offset::Offset; + +/// `take` implementation for utf8 arrays +pub fn take( + values: &BinaryArray, + indices: &PrimitiveArray, +) -> BinaryArray { + let data_type = values.data_type().clone(); + let indices_has_validity = indices.null_count() > 0; + let values_has_validity = values.null_count() > 0; + + let (offsets, values, validity) = match (values_has_validity, indices_has_validity) { + (false, false) => { + take_no_validity::(values.offsets(), values.values(), indices.values()) + }, + (true, false) => take_values_validity(values, indices.values()), + (false, true) => take_indices_validity(values.offsets(), values.values(), indices), + (true, true) => take_values_indices_validity(values, indices), + }; + BinaryArray::::new(data_type, offsets, values, validity) +} diff --git a/crates/nano-arrow/src/compute/take/boolean.rs b/crates/nano-arrow/src/compute/take/boolean.rs new file mode 100644 index 000000000000..62be88e46226 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/boolean.rs @@ -0,0 +1,138 @@ +use super::Index; +use crate::array::{Array, BooleanArray, PrimitiveArray}; +use crate::bitmap::{Bitmap, MutableBitmap}; + +// take implementation when neither values nor indices contain nulls +fn take_no_validity(values: &Bitmap, indices: &[I]) -> (Bitmap, Option) { + let values = indices.iter().map(|index| values.get_bit(index.to_usize())); + let buffer = Bitmap::from_trusted_len_iter(values); + + (buffer, None) +} + +// take implementation when only values contain nulls +fn take_values_validity( + values: &BooleanArray, + indices: &[I], +) -> (Bitmap, Option) { + let validity_values = values.validity().unwrap(); + let validity = indices + .iter() + .map(|index| validity_values.get_bit(index.to_usize())); + let validity = Bitmap::from_trusted_len_iter(validity); + + let values_values = values.values(); + let values = indices + .iter() + .map(|index| values_values.get_bit(index.to_usize())); + let buffer = Bitmap::from_trusted_len_iter(values); + + (buffer, validity.into()) +} + +// take implementation when only indices contain nulls +fn take_indices_validity( + values: &Bitmap, + indices: &PrimitiveArray, +) -> (Bitmap, Option) { + let validity = indices.validity().unwrap(); + + let values = indices.values().iter().enumerate().map(|(i, index)| { + let index = index.to_usize(); + match values.get(index) { + Some(value) => value, + None => { + if !validity.get_bit(i) { + false + } else { + panic!("Out-of-bounds index {index}") + } + }, + } + }); + + let buffer = Bitmap::from_trusted_len_iter(values); + + (buffer, indices.validity().cloned()) +} + +// take implementation when both values and indices contain nulls +fn take_values_indices_validity( + values: &BooleanArray, + indices: &PrimitiveArray, +) -> (Bitmap, Option) { + let mut validity = MutableBitmap::with_capacity(indices.len()); + + let values_validity = values.validity().unwrap(); + + let values_values = values.values(); + let values = indices.iter().map(|index| match index { + Some(index) => { + let index = index.to_usize(); + validity.push(values_validity.get_bit(index)); + values_values.get_bit(index) + }, + None => { + validity.push(false); + false + }, + }); + let values = Bitmap::from_trusted_len_iter(values); + (values, validity.into()) +} + +/// `take` implementation for boolean arrays +pub fn take(values: &BooleanArray, indices: &PrimitiveArray) -> BooleanArray { + let data_type = 
values.data_type().clone(); + let indices_has_validity = indices.null_count() > 0; + let values_has_validity = values.null_count() > 0; + + let (values, validity) = match (values_has_validity, indices_has_validity) { + (false, false) => take_no_validity(values.values(), indices.values()), + (true, false) => take_values_validity(values, indices.values()), + (false, true) => take_indices_validity(values.values(), indices), + (true, true) => take_values_indices_validity(values, indices), + }; + + BooleanArray::new(data_type, values, validity) +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::array::Int32Array; + + fn _all_cases() -> Vec<(Int32Array, BooleanArray, BooleanArray)> { + vec![ + ( + Int32Array::from(&[Some(1), Some(0)]), + BooleanArray::from(vec![Some(true), Some(false)]), + BooleanArray::from(vec![Some(false), Some(true)]), + ), + ( + Int32Array::from(&[Some(1), None]), + BooleanArray::from(vec![Some(true), Some(false)]), + BooleanArray::from(vec![Some(false), None]), + ), + ( + Int32Array::from(&[Some(1), Some(0)]), + BooleanArray::from(vec![None, Some(false)]), + BooleanArray::from(vec![Some(false), None]), + ), + ( + Int32Array::from(&[Some(1), None, Some(0)]), + BooleanArray::from(vec![None, Some(false)]), + BooleanArray::from(vec![Some(false), None, None]), + ), + ] + } + + #[test] + fn all_cases() { + let cases = _all_cases(); + for (indices, input, expected) in cases { + let output = take(&input, &indices); + assert_eq!(expected, output); + } + } +} diff --git a/crates/nano-arrow/src/compute/take/dict.rs b/crates/nano-arrow/src/compute/take/dict.rs new file mode 100644 index 000000000000..bb60c09193f7 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/dict.rs @@ -0,0 +1,41 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. 
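Every `take` kernel in this directory splits into four cases on `(values_has_validity, indices_has_validity)` so that the null-free paths never touch a validity bitmap. The semantics that all four branches implement can be modelled with plain `Option`s; the sketch below is only such a model (vectors standing in for arrow arrays, not the crate's API): a null index produces a null output slot, and a valid index copies whatever value, null or not, it points to.

```rust
// Model of `take` semantics on nullable data using Vec<Option<T>> as a stand-in.
fn take_model<T: Copy>(values: &[Option<T>], indices: &[Option<usize>]) -> Vec<Option<T>> {
    indices
        .iter()
        .map(|index| match index {
            // A valid index copies the referenced slot, which may itself be null.
            Some(i) => values[*i],
            // A null index yields a null output slot.
            None => None,
        })
        .collect()
}

fn main() {
    let values = [Some(true), None, Some(false)];
    let indices = [Some(2), None, Some(1), Some(0)];
    assert_eq!(
        take_model(&values, &indices),
        vec![Some(false), None, None, Some(true)]
    );
}
```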
+ +use super::primitive::take as take_primitive; +use super::Index; +use crate::array::{DictionaryArray, DictionaryKey, PrimitiveArray}; + +/// `take` implementation for dictionary arrays +/// +/// applies `take` to the keys of the dictionary array and returns a new dictionary array +/// with the same dictionary values and reordered keys +pub fn take(values: &DictionaryArray, indices: &PrimitiveArray) -> DictionaryArray +where + K: DictionaryKey, + I: Index, +{ + let keys = take_primitive::(values.keys(), indices); + // safety - this operation takes a subset of keys and thus preserves the dictionary's invariant + unsafe { + DictionaryArray::::try_new_unchecked( + values.data_type().clone(), + keys, + values.values().clone(), + ) + .unwrap() + } +} diff --git a/crates/nano-arrow/src/compute/take/fixed_size_list.rs b/crates/nano-arrow/src/compute/take/fixed_size_list.rs new file mode 100644 index 000000000000..6e7e74b91720 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/fixed_size_list.rs @@ -0,0 +1,63 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. 
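The dictionary kernel just shown only gathers keys; the dictionary values are reused unchanged, which is why the result can be rebuilt with `try_new_unchecked`: the taken keys are a subset of the old keys and therefore remain valid indices into the values. A minimal model of that behaviour, with plain vectors standing in for `DictionaryArray` (not the crate's API):

```rust
// Toy dictionary encoding: each key indexes into the shared `values` table.
struct DictModel {
    keys: Vec<u32>,
    values: Vec<String>,
}

fn take_dict(dict: &DictModel, indices: &[usize]) -> DictModel {
    DictModel {
        // Reorder/duplicate keys according to `indices`...
        keys: indices.iter().map(|&i| dict.keys[i]).collect(),
        // ...while the values ("the dictionary") are reused as-is.
        values: dict.values.clone(),
    }
}

fn main() {
    let dict = DictModel {
        keys: vec![0, 1, 0, 2],
        values: vec!["low".into(), "mid".into(), "high".into()],
    };
    let taken = take_dict(&dict, &[3, 3, 0]);
    assert_eq!(taken.keys, vec![2, 2, 0]);
    assert_eq!(taken.values, dict.values);
}
```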
+ +use super::Index; +use crate::array::growable::{Growable, GrowableFixedSizeList}; +use crate::array::{FixedSizeListArray, PrimitiveArray}; + +/// `take` implementation for FixedSizeListArrays +pub fn take( + values: &FixedSizeListArray, + indices: &PrimitiveArray, +) -> FixedSizeListArray { + let mut capacity = 0; + let arrays = indices + .values() + .iter() + .map(|index| { + let index = index.to_usize(); + let slice = values.clone().sliced(index, 1); + capacity += slice.len(); + slice + }) + .collect::>(); + + let arrays = arrays.iter().collect(); + + if let Some(validity) = indices.validity() { + let mut growable: GrowableFixedSizeList = + GrowableFixedSizeList::new(arrays, true, capacity); + + for index in 0..indices.len() { + if validity.get_bit(index) { + growable.extend(index, 0, 1); + } else { + growable.extend_validity(1) + } + } + + growable.into() + } else { + let mut growable: GrowableFixedSizeList = + GrowableFixedSizeList::new(arrays, false, capacity); + for index in 0..indices.len() { + growable.extend(index, 0, 1); + } + + growable.into() + } +} diff --git a/crates/nano-arrow/src/compute/take/generic_binary.rs b/crates/nano-arrow/src/compute/take/generic_binary.rs new file mode 100644 index 000000000000..9f6658c7d5a0 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/generic_binary.rs @@ -0,0 +1,155 @@ +use super::Index; +use crate::array::{GenericBinaryArray, PrimitiveArray}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::buffer::Buffer; +use crate::offset::{Offset, Offsets, OffsetsBuffer}; + +pub fn take_values( + length: O, + starts: &[O], + offsets: &OffsetsBuffer, + values: &[u8], +) -> Buffer { + let new_len = length.to_usize(); + let mut buffer = Vec::with_capacity(new_len); + starts + .iter() + .map(|start| start.to_usize()) + .zip(offsets.lengths()) + .for_each(|(start, length)| { + let end = start + length; + buffer.extend_from_slice(&values[start..end]); + }); + buffer.into() +} + +// take implementation when neither values nor indices contain nulls +pub fn take_no_validity( + offsets: &OffsetsBuffer, + values: &[u8], + indices: &[I], +) -> (OffsetsBuffer, Buffer, Option) { + let mut buffer = Vec::::new(); + let lengths = indices.iter().map(|index| index.to_usize()).map(|index| { + let (start, end) = offsets.start_end(index); + // todo: remove this bound check + buffer.extend_from_slice(&values[start..end]); + end - start + }); + let offsets = Offsets::try_from_lengths(lengths).expect(""); + + (offsets.into(), buffer.into(), None) +} + +// take implementation when only values contain nulls +pub fn take_values_validity>( + values: &A, + indices: &[I], +) -> (OffsetsBuffer, Buffer, Option) { + let validity_values = values.validity().unwrap(); + let validity = indices + .iter() + .map(|index| validity_values.get_bit(index.to_usize())); + let validity = Bitmap::from_trusted_len_iter(validity); + + let mut length = O::default(); + + let offsets = values.offsets(); + let values_values = values.values(); + + let mut starts = Vec::::with_capacity(indices.len()); + let offsets = indices.iter().map(|index| { + let index = index.to_usize(); + let start = offsets[index]; + length += offsets[index + 1] - start; + starts.push(start); + length + }); + let offsets = std::iter::once(O::default()) + .chain(offsets) + .collect::>(); + // Safety: by construction offsets are monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }.into(); + + let buffer = take_values(length, starts.as_slice(), &offsets, values_values); + + (offsets, buffer, 
validity.into()) +} + +// take implementation when only indices contain nulls +pub fn take_indices_validity( + offsets: &OffsetsBuffer, + values: &[u8], + indices: &PrimitiveArray, +) -> (OffsetsBuffer, Buffer, Option) { + let mut length = O::default(); + + let offsets = offsets.buffer(); + + let mut starts = Vec::::with_capacity(indices.len()); + let offsets = indices.values().iter().map(|index| { + let index = index.to_usize(); + match offsets.get(index + 1) { + Some(&next) => { + let start = offsets[index]; + length += next - start; + starts.push(start); + }, + None => starts.push(O::default()), + }; + length + }); + let offsets = std::iter::once(O::default()) + .chain(offsets) + .collect::>(); + // Safety: by construction offsets are monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }.into(); + + let buffer = take_values(length, &starts, &offsets, values); + + (offsets, buffer, indices.validity().cloned()) +} + +// take implementation when both indices and values contain nulls +pub fn take_values_indices_validity>( + values: &A, + indices: &PrimitiveArray, +) -> (OffsetsBuffer, Buffer, Option) { + let mut length = O::default(); + let mut validity = MutableBitmap::with_capacity(indices.len()); + + let values_validity = values.validity().unwrap(); + let offsets = values.offsets(); + let values_values = values.values(); + + let mut starts = Vec::::with_capacity(indices.len()); + let offsets = indices.iter().map(|index| { + match index { + Some(index) => { + let index = index.to_usize(); + if values_validity.get_bit(index) { + validity.push(true); + length += offsets[index + 1] - offsets[index]; + starts.push(offsets[index]); + } else { + validity.push(false); + starts.push(O::default()); + } + }, + None => { + validity.push(false); + starts.push(O::default()); + }, + }; + length + }); + let offsets = std::iter::once(O::default()) + .chain(offsets) + .collect::>(); + // Safety: by construction offsets are monotonically increasing + let offsets = unsafe { Offsets::new_unchecked(offsets) }.into(); + + let buffer = take_values(length, &starts, &offsets, values_values); + + (offsets, buffer, validity.into()) +} diff --git a/crates/nano-arrow/src/compute/take/list.rs b/crates/nano-arrow/src/compute/take/list.rs new file mode 100644 index 000000000000..58fb9d6fd788 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/list.rs @@ -0,0 +1,62 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. 
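All of the variable-length helpers in `generic_binary.rs` follow the same recipe: gather the per-row lengths to build new offsets, then copy the referenced byte ranges into a fresh values buffer. A compact model of that recipe, with plain vectors standing in for `OffsetsBuffer`/`Buffer` (not the crate's API); row `i` spans `values[offsets[i]..offsets[i + 1]]`:

```rust
// Take rows from an offsets+values layout: new offsets are the running sum of the
// taken lengths, and the new values buffer is the concatenation of the taken slices.
fn take_var_sized(offsets: &[i32], values: &[u8], indices: &[usize]) -> (Vec<i32>, Vec<u8>) {
    let mut new_offsets = Vec::with_capacity(indices.len() + 1);
    new_offsets.push(0i32);
    let mut new_values = Vec::new();
    for &i in indices {
        let (start, end) = (offsets[i] as usize, offsets[i + 1] as usize);
        new_values.extend_from_slice(&values[start..end]);
        new_offsets.push(new_values.len() as i32);
    }
    (new_offsets, new_values)
}

fn main() {
    // Three rows: "a", "bc", "def".
    let offsets = [0, 1, 3, 6];
    let values = b"abcdef";
    let (new_offsets, new_values) = take_var_sized(&offsets, values, &[2, 0]);
    assert_eq!(new_offsets, vec![0, 3, 4]);
    assert_eq!(new_values, b"defa".to_vec());
}
```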
+ +use super::Index; +use crate::array::growable::{Growable, GrowableList}; +use crate::array::{ListArray, PrimitiveArray}; +use crate::offset::Offset; + +/// `take` implementation for ListArrays +pub fn take( + values: &ListArray, + indices: &PrimitiveArray, +) -> ListArray { + let mut capacity = 0; + let arrays = indices + .values() + .iter() + .map(|index| { + let index = index.to_usize(); + let slice = values.clone().sliced(index, 1); + capacity += slice.len(); + slice + }) + .collect::>>(); + + let arrays = arrays.iter().collect(); + + if let Some(validity) = indices.validity() { + let mut growable: GrowableList = GrowableList::new(arrays, true, capacity); + + for index in 0..indices.len() { + if validity.get_bit(index) { + growable.extend(index, 0, 1); + } else { + growable.extend_validity(1) + } + } + + growable.into() + } else { + let mut growable: GrowableList = GrowableList::new(arrays, false, capacity); + for index in 0..indices.len() { + growable.extend(index, 0, 1); + } + + growable.into() + } +} diff --git a/crates/nano-arrow/src/compute/take/mod.rs b/crates/nano-arrow/src/compute/take/mod.rs new file mode 100644 index 000000000000..d526713a4327 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/mod.rs @@ -0,0 +1,132 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +//! Defines take kernel for [`Array`] + +use crate::array::{new_empty_array, Array, NullArray, PrimitiveArray}; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::Index; + +mod binary; +mod boolean; +mod dict; +mod fixed_size_list; +mod generic_binary; +mod list; +mod primitive; +mod structure; +mod utf8; + +pub(crate) use boolean::take as take_boolean; + +/// Returns a new [`Array`] with only indices at `indices`. Null indices are taken as nulls. +/// The returned array has a length equal to `indices.len()`. 
+pub fn take(values: &dyn Array, indices: &PrimitiveArray) -> Result> { + if indices.len() == 0 { + return Ok(new_empty_array(values.data_type().clone())); + } + + use crate::datatypes::PhysicalType::*; + match values.data_type().to_physical_type() { + Null => Ok(Box::new(NullArray::new( + values.data_type().clone(), + indices.len(), + ))), + Boolean => { + let values = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(boolean::take::(values, indices))) + }, + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let values = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(primitive::take::<$T, _>(&values, indices))) + }), + LargeUtf8 => { + let values = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(utf8::take::(values, indices))) + }, + LargeBinary => { + let values = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(binary::take::(values, indices))) + }, + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + let values = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(dict::take::<$T, _>(&values, indices))) + }) + }, + Struct => { + let array = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(structure::take::<_>(array, indices)?)) + }, + LargeList => { + let array = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(list::take::(array, indices))) + }, + FixedSizeList => { + let array = values.as_any().downcast_ref().unwrap(); + Ok(Box::new(fixed_size_list::take::(array, indices))) + }, + t => unimplemented!("Take not supported for data type {:?}", t), + } +} + +/// Checks if an array of type `datatype` can perform take operation +/// +/// # Examples +/// ``` +/// use arrow2::compute::take::can_take; +/// use arrow2::datatypes::{DataType}; +/// +/// let data_type = DataType::Int8; +/// assert_eq!(can_take(&data_type), true); +/// ``` +pub fn can_take(data_type: &DataType) -> bool { + matches!( + data_type, + DataType::Null + | DataType::Boolean + | DataType::Int8 + | DataType::Int16 + | DataType::Int32 + | DataType::Date32 + | DataType::Time32(_) + | DataType::Interval(_) + | DataType::Int64 + | DataType::Date64 + | DataType::Time64(_) + | DataType::Duration(_) + | DataType::Timestamp(_, _) + | DataType::UInt8 + | DataType::UInt16 + | DataType::UInt32 + | DataType::UInt64 + | DataType::Float16 + | DataType::Float32 + | DataType::Float64 + | DataType::Decimal(_, _) + | DataType::Utf8 + | DataType::LargeUtf8 + | DataType::Binary + | DataType::LargeBinary + | DataType::Struct(_) + | DataType::List(_) + | DataType::LargeList(_) + | DataType::FixedSizeList(_, _) + | DataType::Dictionary(..) 
+ ) +} diff --git a/crates/nano-arrow/src/compute/take/primitive.rs b/crates/nano-arrow/src/compute/take/primitive.rs new file mode 100644 index 000000000000..5ce53ba7cc20 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/primitive.rs @@ -0,0 +1,112 @@ +use super::Index; +use crate::array::{Array, PrimitiveArray}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::buffer::Buffer; +use crate::types::NativeType; + +// take implementation when neither values nor indices contain nulls +fn take_no_validity( + values: &[T], + indices: &[I], +) -> (Buffer, Option) { + let values = indices + .iter() + .map(|index| values[index.to_usize()]) + .collect::>(); + + (values.into(), None) +} + +// take implementation when only values contain nulls +fn take_values_validity( + values: &PrimitiveArray, + indices: &[I], +) -> (Buffer, Option) { + let values_validity = values.validity().unwrap(); + + let validity = indices + .iter() + .map(|index| values_validity.get_bit(index.to_usize())); + let validity = MutableBitmap::from_trusted_len_iter(validity); + + let values_values = values.values(); + + let values = indices + .iter() + .map(|index| values_values[index.to_usize()]) + .collect::>(); + + (values.into(), validity.into()) +} + +// take implementation when only indices contain nulls +fn take_indices_validity( + values: &[T], + indices: &PrimitiveArray, +) -> (Buffer, Option) { + let validity = indices.validity().unwrap(); + let values = indices + .values() + .iter() + .enumerate() + .map(|(i, index)| { + let index = index.to_usize(); + match values.get(index) { + Some(value) => *value, + None => { + if !validity.get_bit(i) { + T::default() + } else { + panic!("Out-of-bounds index {index}") + } + }, + } + }) + .collect::>(); + + (values.into(), indices.validity().cloned()) +} + +// take implementation when both values and indices contain nulls +fn take_values_indices_validity( + values: &PrimitiveArray, + indices: &PrimitiveArray, +) -> (Buffer, Option) { + let mut bitmap = MutableBitmap::with_capacity(indices.len()); + + let values_validity = values.validity().unwrap(); + + let values_values = values.values(); + let values = indices + .iter() + .map(|index| match index { + Some(index) => { + let index = index.to_usize(); + bitmap.push(values_validity.get_bit(index)); + values_values[index] + }, + None => { + bitmap.push(false); + T::default() + }, + }) + .collect::>(); + (values.into(), bitmap.into()) +} + +/// `take` implementation for primitive arrays +pub fn take( + values: &PrimitiveArray, + indices: &PrimitiveArray, +) -> PrimitiveArray { + let indices_has_validity = indices.null_count() > 0; + let values_has_validity = values.null_count() > 0; + let (buffer, validity) = match (values_has_validity, indices_has_validity) { + (false, false) => take_no_validity::(values.values(), indices.values()), + (true, false) => take_values_validity::(values, indices.values()), + (false, true) => take_indices_validity::(values.values(), indices), + (true, true) => take_values_indices_validity::(values, indices), + }; + + PrimitiveArray::::new(values.data_type().clone(), buffer, validity) +} diff --git a/crates/nano-arrow/src/compute/take/structure.rs b/crates/nano-arrow/src/compute/take/structure.rs new file mode 100644 index 000000000000..e0a2717f5746 --- /dev/null +++ b/crates/nano-arrow/src/compute/take/structure.rs @@ -0,0 +1,63 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. 
See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +use super::Index; +use crate::array::{Array, PrimitiveArray, StructArray}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::error::Result; + +#[inline] +fn take_validity( + validity: Option<&Bitmap>, + indices: &PrimitiveArray, +) -> Result> { + let indices_validity = indices.validity(); + match (validity, indices_validity) { + (None, _) => Ok(indices_validity.cloned()), + (Some(validity), None) => { + let iter = indices.values().iter().map(|index| { + let index = index.to_usize(); + validity.get_bit(index) + }); + Ok(MutableBitmap::from_trusted_len_iter(iter).into()) + }, + (Some(validity), _) => { + let iter = indices.iter().map(|x| match x { + Some(index) => { + let index = index.to_usize(); + validity.get_bit(index) + }, + None => false, + }); + Ok(MutableBitmap::from_trusted_len_iter(iter).into()) + }, + } +} + +pub fn take(array: &StructArray, indices: &PrimitiveArray) -> Result { + let values: Vec> = array + .values() + .iter() + .map(|a| super::take(a.as_ref(), indices)) + .collect::>()?; + let validity = take_validity(array.validity(), indices)?; + Ok(StructArray::new( + array.data_type().clone(), + values, + validity, + )) +} diff --git a/crates/nano-arrow/src/compute/take/utf8.rs b/crates/nano-arrow/src/compute/take/utf8.rs new file mode 100644 index 000000000000..3f5f5877c12f --- /dev/null +++ b/crates/nano-arrow/src/compute/take/utf8.rs @@ -0,0 +1,86 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. 
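For struct arrays, `take` (shown just above) applies the same indices to every child and gathers the struct-level validity alongside; null indices additionally force the corresponding output slots to null via `take_validity`. The sketch below models only the per-child gathering with plain vectors (not the crate's `StructArray`) and omits null indices for brevity.

```rust
// A struct-of-arrays with a struct-level validity column.
struct StructModel {
    ints: Vec<i64>,
    names: Vec<String>,
    validity: Vec<bool>,
}

fn take_struct(array: &StructModel, indices: &[usize]) -> StructModel {
    StructModel {
        // The same indices are applied to every child column...
        ints: indices.iter().map(|&i| array.ints[i]).collect(),
        names: indices.iter().map(|&i| array.names[i].clone()).collect(),
        // ...and to the struct-level validity.
        validity: indices.iter().map(|&i| array.validity[i]).collect(),
    }
}

fn main() {
    let array = StructModel {
        ints: vec![1, 2, 3],
        names: vec!["a".into(), "b".into(), "c".into()],
        validity: vec![true, false, true],
    };
    let taken = take_struct(&array, &[2, 1]);
    assert_eq!(taken.ints, vec![3, 2]);
    assert_eq!(taken.names, vec!["c".to_string(), "b".to_string()]);
    assert_eq!(taken.validity, vec![true, false]);
}
```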
+ +use super::generic_binary::*; +use super::Index; +use crate::array::{Array, PrimitiveArray, Utf8Array}; +use crate::offset::Offset; + +/// `take` implementation for utf8 arrays +pub fn take( + values: &Utf8Array, + indices: &PrimitiveArray, +) -> Utf8Array { + let data_type = values.data_type().clone(); + let indices_has_validity = indices.null_count() > 0; + let values_has_validity = values.null_count() > 0; + + let (offsets, values, validity) = match (values_has_validity, indices_has_validity) { + (false, false) => { + take_no_validity::(values.offsets(), values.values(), indices.values()) + }, + (true, false) => take_values_validity(values, indices.values()), + (false, true) => take_indices_validity(values.offsets(), values.values(), indices), + (true, true) => take_values_indices_validity(values, indices), + }; + unsafe { Utf8Array::::new_unchecked(data_type, offsets, values, validity) } +} + +#[cfg(test)] +mod tests { + use super::*; + use crate::array::Int32Array; + + fn _all_cases() -> Vec<(Int32Array, Utf8Array, Utf8Array)> { + vec![ + ( + Int32Array::from(&[Some(1), Some(0)]), + Utf8Array::::from(vec![Some("one"), Some("two")]), + Utf8Array::::from(vec![Some("two"), Some("one")]), + ), + ( + Int32Array::from(&[Some(1), None]), + Utf8Array::::from(vec![Some("one"), Some("two")]), + Utf8Array::::from(vec![Some("two"), None]), + ), + ( + Int32Array::from(&[Some(1), Some(0)]), + Utf8Array::::from(vec![None, Some("two")]), + Utf8Array::::from(vec![Some("two"), None]), + ), + ( + Int32Array::from(&[Some(1), None, Some(0)]), + Utf8Array::::from(vec![None, Some("two")]), + Utf8Array::::from(vec![Some("two"), None, None]), + ), + ] + } + + #[test] + fn all_cases() { + let cases = _all_cases::(); + for (indices, input, expected) in cases { + let output = take(&input, &indices); + assert_eq!(expected, output); + } + let cases = _all_cases::(); + for (indices, input, expected) in cases { + let output = take(&input, &indices); + assert_eq!(expected, output); + } + } +} diff --git a/crates/nano-arrow/src/compute/temporal.rs b/crates/nano-arrow/src/compute/temporal.rs new file mode 100644 index 000000000000..132492f58b6e --- /dev/null +++ b/crates/nano-arrow/src/compute/temporal.rs @@ -0,0 +1,410 @@ +// Licensed to the Apache Software Foundation (ASF) under one +// or more contributor license agreements. See the NOTICE file +// distributed with this work for additional information +// regarding copyright ownership. The ASF licenses this file +// to you under the Apache License, Version 2.0 (the +// "License"); you may not use this file except in compliance +// with the License. You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, +// software distributed under the License is distributed on an +// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY +// KIND, either express or implied. See the License for the +// specific language governing permissions and limitations +// under the License. + +//! Defines temporal kernels for time and date related functions. 
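The temporal kernels that follow all reduce to the same step: reinterpret the stored integer in its unit (days, seconds, milliseconds, ...) as a chrono value and apply a `Datelike`/`Timelike` accessor. For example, a `Date32` value is a count of days since 1970-01-01. Below is a minimal, crate-independent illustration using chrono directly; it assumes a chrono 0.4-style API (the same dependency the kernels use) and is not the crate's conversion code.

```rust
use chrono::{Datelike, Duration, NaiveDate};

// Convert a Date32-style value (days since the UNIX epoch) to (year, month, day).
fn date32_to_ymd(days_since_epoch: i32) -> (i32, u32, u32) {
    let epoch = NaiveDate::from_ymd_opt(1970, 1, 1).unwrap();
    let date = epoch + Duration::days(days_since_epoch as i64);
    (date.year(), date.month(), date.day())
}

fn main() {
    // 19_000 days after 1970-01-01 is 2022-01-08.
    assert_eq!(date32_to_ymd(19_000), (2022, 1, 8));
}
```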
+ +use chrono::{Datelike, Timelike}; + +use super::arity::unary; +use crate::array::*; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::temporal_conversions::*; +use crate::types::NativeType; + +// Create and implement a trait that converts chrono's `Weekday` +// type into `u32` +trait U32Weekday: Datelike { + fn u32_weekday(&self) -> u32 { + self.weekday().number_from_monday() + } +} + +impl U32Weekday for chrono::NaiveDateTime {} +impl U32Weekday for chrono::DateTime {} + +// Create and implement a trait that converts chrono's `IsoWeek` +// type into `u32` +trait U32IsoWeek: Datelike { + fn u32_iso_week(&self) -> u32 { + self.iso_week().week() + } +} + +impl U32IsoWeek for chrono::NaiveDateTime {} +impl U32IsoWeek for chrono::DateTime {} + +// Macro to avoid repetition in functions, that apply +// `chrono::Datelike` methods on Arrays +macro_rules! date_like { + ($extract:ident, $array:ident, $data_type:path) => { + match $array.data_type().to_logical_type() { + DataType::Date32 | DataType::Date64 | DataType::Timestamp(_, None) => { + date_variants($array, $data_type, |x| x.$extract()) + }, + DataType::Timestamp(time_unit, Some(timezone_str)) => { + let array = $array.as_any().downcast_ref().unwrap(); + + if let Ok(timezone) = parse_offset(timezone_str) { + Ok(extract_impl(array, *time_unit, timezone, |x| x.$extract())) + } else { + chrono_tz(array, *time_unit, timezone_str, |x| x.$extract()) + } + }, + dt => Err(Error::NotYetImplemented(format!( + "\"{}\" does not support type {:?}", + stringify!($extract), + dt + ))), + } + }; +} + +/// Extracts the years of a temporal array as [`PrimitiveArray`]. +/// Use [`can_year`] to check if this operation is supported for the target [`DataType`]. +pub fn year(array: &dyn Array) -> Result> { + date_like!(year, array, DataType::Int32) +} + +/// Extracts the months of a temporal array as [`PrimitiveArray`]. +/// Value ranges from 1 to 12. +/// Use [`can_month`] to check if this operation is supported for the target [`DataType`]. +pub fn month(array: &dyn Array) -> Result> { + date_like!(month, array, DataType::UInt32) +} + +/// Extracts the days of a temporal array as [`PrimitiveArray`]. +/// Value ranges from 1 to 32 (Last day depends on month). +/// Use [`can_day`] to check if this operation is supported for the target [`DataType`]. +pub fn day(array: &dyn Array) -> Result> { + date_like!(day, array, DataType::UInt32) +} + +/// Extracts weekday of a temporal array as [`PrimitiveArray`]. +/// Monday is 1, Tuesday is 2, ..., Sunday is 7. +/// Use [`can_weekday`] to check if this operation is supported for the target [`DataType`] +pub fn weekday(array: &dyn Array) -> Result> { + date_like!(u32_weekday, array, DataType::UInt32) +} + +/// Extracts ISO week of a temporal array as [`PrimitiveArray`] +/// Value ranges from 1 to 53 (Last week depends on the year). +/// Use [`can_iso_week`] to check if this operation is supported for the target [`DataType`] +pub fn iso_week(array: &dyn Array) -> Result> { + date_like!(u32_iso_week, array, DataType::UInt32) +} + +// Macro to avoid repetition in functions, that apply +// `chrono::Timelike` methods on Arrays +macro_rules! 
time_like { + ($extract:ident, $array:ident, $data_type:path) => { + match $array.data_type().to_logical_type() { + DataType::Date32 | DataType::Date64 | DataType::Timestamp(_, None) => { + date_variants($array, $data_type, |x| x.$extract()) + }, + DataType::Time32(_) | DataType::Time64(_) => { + time_variants($array, DataType::UInt32, |x| x.$extract()) + }, + DataType::Timestamp(time_unit, Some(timezone_str)) => { + let array = $array.as_any().downcast_ref().unwrap(); + + if let Ok(timezone) = parse_offset(timezone_str) { + Ok(extract_impl(array, *time_unit, timezone, |x| x.$extract())) + } else { + chrono_tz(array, *time_unit, timezone_str, |x| x.$extract()) + } + }, + dt => Err(Error::NotYetImplemented(format!( + "\"{}\" does not support type {:?}", + stringify!($extract), + dt + ))), + } + }; +} + +/// Extracts the hours of a temporal array as [`PrimitiveArray`]. +/// Value ranges from 0 to 23. +/// Use [`can_hour`] to check if this operation is supported for the target [`DataType`]. +pub fn hour(array: &dyn Array) -> Result> { + time_like!(hour, array, DataType::UInt32) +} + +/// Extracts the minutes of a temporal array as [`PrimitiveArray`]. +/// Value ranges from 0 to 59. +/// Use [`can_minute`] to check if this operation is supported for the target [`DataType`]. +pub fn minute(array: &dyn Array) -> Result> { + time_like!(minute, array, DataType::UInt32) +} + +/// Extracts the seconds of a temporal array as [`PrimitiveArray`]. +/// Value ranges from 0 to 59. +/// Use [`can_second`] to check if this operation is supported for the target [`DataType`]. +pub fn second(array: &dyn Array) -> Result> { + time_like!(second, array, DataType::UInt32) +} + +/// Extracts the nanoseconds of a temporal array as [`PrimitiveArray`]. +/// Use [`can_nanosecond`] to check if this operation is supported for the target [`DataType`]. 
+pub fn nanosecond(array: &dyn Array) -> Result> { + time_like!(nanosecond, array, DataType::UInt32) +} + +fn date_variants(array: &dyn Array, data_type: DataType, op: F) -> Result> +where + O: NativeType, + F: Fn(chrono::NaiveDateTime) -> O, +{ + match array.data_type().to_logical_type() { + DataType::Date32 => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(date32_to_datetime(x)), data_type)) + }, + DataType::Date64 => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(date64_to_datetime(x)), data_type)) + }, + DataType::Timestamp(time_unit, None) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let func = match time_unit { + TimeUnit::Second => timestamp_s_to_datetime, + TimeUnit::Millisecond => timestamp_ms_to_datetime, + TimeUnit::Microsecond => timestamp_us_to_datetime, + TimeUnit::Nanosecond => timestamp_ns_to_datetime, + }; + Ok(unary(array, |x| op(func(x)), data_type)) + }, + _ => unreachable!(), + } +} + +fn time_variants(array: &dyn Array, data_type: DataType, op: F) -> Result> +where + O: NativeType, + F: Fn(chrono::NaiveTime) -> O, +{ + match array.data_type().to_logical_type() { + DataType::Time32(TimeUnit::Second) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(time32s_to_time(x)), data_type)) + }, + DataType::Time32(TimeUnit::Millisecond) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(time32ms_to_time(x)), data_type)) + }, + DataType::Time64(TimeUnit::Microsecond) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(time64us_to_time(x)), data_type)) + }, + DataType::Time64(TimeUnit::Nanosecond) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(unary(array, |x| op(time64ns_to_time(x)), data_type)) + }, + _ => unreachable!(), + } +} + +#[cfg(feature = "chrono-tz")] +fn chrono_tz( + array: &PrimitiveArray, + time_unit: TimeUnit, + timezone_str: &str, + op: F, +) -> Result> +where + O: NativeType, + F: Fn(chrono::DateTime) -> O, +{ + let timezone = parse_offset_tz(timezone_str)?; + Ok(extract_impl(array, time_unit, timezone, op)) +} + +#[cfg(not(feature = "chrono-tz"))] +fn chrono_tz( + _: &PrimitiveArray, + _: TimeUnit, + timezone_str: &str, + _: F, +) -> Result> +where + O: NativeType, + F: Fn(chrono::DateTime) -> O, +{ + Err(Error::InvalidArgumentError(format!( + "timezone \"{}\" cannot be parsed (feature chrono-tz is not active)", + timezone_str + ))) +} + +fn extract_impl( + array: &PrimitiveArray, + time_unit: TimeUnit, + timezone: T, + extract: F, +) -> PrimitiveArray +where + T: chrono::TimeZone, + A: NativeType, + F: Fn(chrono::DateTime) -> A, +{ + match time_unit { + TimeUnit::Second => { + let op = |x| { + let datetime = timestamp_s_to_datetime(x); + let offset = timezone.offset_from_utc_datetime(&datetime); + extract(chrono::DateTime::::from_naive_utc_and_offset( + datetime, offset, + )) + }; + unary(array, op, A::PRIMITIVE.into()) + }, + TimeUnit::Millisecond => { + let op = |x| { + let datetime = timestamp_ms_to_datetime(x); + let offset = timezone.offset_from_utc_datetime(&datetime); + extract(chrono::DateTime::::from_naive_utc_and_offset( + datetime, offset, + )) + }; + unary(array, op, A::PRIMITIVE.into()) + }, + TimeUnit::Microsecond => { + let op = |x| { + let datetime = timestamp_us_to_datetime(x); + let offset = timezone.offset_from_utc_datetime(&datetime); + 
extract(chrono::DateTime::::from_naive_utc_and_offset( + datetime, offset, + )) + }; + unary(array, op, A::PRIMITIVE.into()) + }, + TimeUnit::Nanosecond => { + let op = |x| { + let datetime = timestamp_ns_to_datetime(x); + let offset = timezone.offset_from_utc_datetime(&datetime); + extract(chrono::DateTime::::from_naive_utc_and_offset( + datetime, offset, + )) + }; + unary(array, op, A::PRIMITIVE.into()) + }, + } +} + +/// Checks if an array of type `datatype` can perform year operation +/// +/// # Examples +/// ``` +/// use arrow2::compute::temporal::can_year; +/// use arrow2::datatypes::{DataType}; +/// +/// assert_eq!(can_year(&DataType::Date32), true); +/// assert_eq!(can_year(&DataType::Int8), false); +/// ``` +pub fn can_year(data_type: &DataType) -> bool { + can_date(data_type) +} + +/// Checks if an array of type `datatype` can perform month operation +pub fn can_month(data_type: &DataType) -> bool { + can_date(data_type) +} + +/// Checks if an array of type `datatype` can perform day operation +pub fn can_day(data_type: &DataType) -> bool { + can_date(data_type) +} + +/// Checks if an array of type `data_type` can perform weekday operation +pub fn can_weekday(data_type: &DataType) -> bool { + can_date(data_type) +} + +/// Checks if an array of type `data_type` can perform ISO week operation +pub fn can_iso_week(data_type: &DataType) -> bool { + can_date(data_type) +} + +fn can_date(data_type: &DataType) -> bool { + matches!( + data_type, + DataType::Date32 | DataType::Date64 | DataType::Timestamp(_, _) + ) +} + +/// Checks if an array of type `datatype` can perform hour operation +/// +/// # Examples +/// ``` +/// use arrow2::compute::temporal::can_hour; +/// use arrow2::datatypes::{DataType, TimeUnit}; +/// +/// assert_eq!(can_hour(&DataType::Time32(TimeUnit::Second)), true); +/// assert_eq!(can_hour(&DataType::Int8), false); +/// ``` +pub fn can_hour(data_type: &DataType) -> bool { + can_time(data_type) +} + +/// Checks if an array of type `datatype` can perform minute operation +pub fn can_minute(data_type: &DataType) -> bool { + can_time(data_type) +} + +/// Checks if an array of type `datatype` can perform second operation +pub fn can_second(data_type: &DataType) -> bool { + can_time(data_type) +} + +/// Checks if an array of type `datatype` can perform nanosecond operation +pub fn can_nanosecond(data_type: &DataType) -> bool { + can_time(data_type) +} + +fn can_time(data_type: &DataType) -> bool { + matches!( + data_type, + DataType::Time32(TimeUnit::Second) + | DataType::Time32(TimeUnit::Millisecond) + | DataType::Time64(TimeUnit::Microsecond) + | DataType::Time64(TimeUnit::Nanosecond) + | DataType::Date32 + | DataType::Date64 + | DataType::Timestamp(_, _) + ) +} diff --git a/crates/nano-arrow/src/compute/utils.rs b/crates/nano-arrow/src/compute/utils.rs new file mode 100644 index 000000000000..e06acdcd470c --- /dev/null +++ b/crates/nano-arrow/src/compute/utils.rs @@ -0,0 +1,23 @@ +use crate::array::Array; +use crate::bitmap::Bitmap; +use crate::error::{Error, Result}; + +pub fn combine_validities(lhs: Option<&Bitmap>, rhs: Option<&Bitmap>) -> Option { + match (lhs, rhs) { + (Some(lhs), None) => Some(lhs.clone()), + (None, Some(rhs)) => Some(rhs.clone()), + (None, None) => None, + (Some(lhs), Some(rhs)) => Some(lhs & rhs), + } +} + +// Errors iff the two arrays have a different length. 
+#[inline] +pub fn check_same_len(lhs: &dyn Array, rhs: &dyn Array) -> Result<()> { + if lhs.len() != rhs.len() { + return Err(Error::InvalidArgumentError( + "Arrays must have the same length".to_string(), + )); + } + Ok(()) +} diff --git a/crates/nano-arrow/src/datatypes/field.rs b/crates/nano-arrow/src/datatypes/field.rs new file mode 100644 index 000000000000..489cacb0b5b5 --- /dev/null +++ b/crates/nano-arrow/src/datatypes/field.rs @@ -0,0 +1,96 @@ +#[cfg(feature = "serde_types")] +use serde_derive::{Deserialize, Serialize}; + +use super::{DataType, Metadata}; + +/// Represents Arrow's metadata of a "column". +/// +/// A [`Field`] is the closest representation of the traditional "column": a logical type +/// ([`DataType`]) with a name and nullability. +/// A Field has optional [`Metadata`] that can be used to annotate the field with custom metadata. +/// +/// Almost all IO in this crate uses [`Field`] to represent logical information about the data +/// to be serialized. +#[derive(Debug, Clone, Eq, PartialEq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub struct Field { + /// Its name + pub name: String, + /// Its logical [`DataType`] + pub data_type: DataType, + /// Its nullability + pub is_nullable: bool, + /// Additional custom (opaque) metadata. + pub metadata: Metadata, +} + +impl Field { + /// Creates a new [`Field`]. + pub fn new>(name: T, data_type: DataType, is_nullable: bool) -> Self { + Field { + name: name.into(), + data_type, + is_nullable, + metadata: Default::default(), + } + } + + /// Creates a new [`Field`] with metadata. + #[inline] + pub fn with_metadata(self, metadata: Metadata) -> Self { + Self { + name: self.name, + data_type: self.data_type, + is_nullable: self.is_nullable, + metadata, + } + } + + /// Returns the [`Field`]'s [`DataType`]. + #[inline] + pub fn data_type(&self) -> &DataType { + &self.data_type + } +} + +#[cfg(feature = "arrow")] +impl From for arrow_schema::Field { + fn from(value: Field) -> Self { + Self::new(value.name, value.data_type.into(), value.is_nullable) + .with_metadata(value.metadata.into_iter().collect()) + } +} + +#[cfg(feature = "arrow")] +impl From for Field { + fn from(value: arrow_schema::Field) -> Self { + (&value).into() + } +} + +#[cfg(feature = "arrow")] +impl From<&arrow_schema::Field> for Field { + fn from(value: &arrow_schema::Field) -> Self { + let data_type = value.data_type().clone().into(); + let metadata = value + .metadata() + .iter() + .map(|(k, v)| (k.clone(), v.clone())) + .collect(); + Self::new(value.name(), data_type, value.is_nullable()).with_metadata(metadata) + } +} + +#[cfg(feature = "arrow")] +impl From for Field { + fn from(value: arrow_schema::FieldRef) -> Self { + value.as_ref().into() + } +} + +#[cfg(feature = "arrow")] +impl From<&arrow_schema::FieldRef> for Field { + fn from(value: &arrow_schema::FieldRef) -> Self { + value.as_ref().into() + } +} diff --git a/crates/nano-arrow/src/datatypes/mod.rs b/crates/nano-arrow/src/datatypes/mod.rs new file mode 100644 index 000000000000..7487af3a0a9a --- /dev/null +++ b/crates/nano-arrow/src/datatypes/mod.rs @@ -0,0 +1,513 @@ +#![forbid(unsafe_code)] +//! Contains all metadata, such as [`PhysicalType`], [`DataType`], [`Field`] and [`Schema`]. 
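Taken together, `Field`, `Metadata` and the `DataType` enum defined below describe a column without any data attached. The snippet below is a sketch against the API as shown in this diff, not a tested example; it assumes the crate is imported as `nano_arrow` (mirroring the file layout) and that `Metadata` is the `BTreeMap<String, String>` typedef declared below.

```rust
use nano_arrow::datatypes::{DataType, Field, Metadata};

fn main() {
    // Opaque, custom key/value metadata attached to the field.
    let mut metadata = Metadata::new();
    metadata.insert("description".to_string(), "unix timestamp".to_string());

    // A nullable Int64 column named "ts".
    let field = Field::new("ts", DataType::Int64, true).with_metadata(metadata);
    assert_eq!(field.data_type(), &DataType::Int64);
    assert!(field.is_nullable);
}
```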
+ +mod field; +mod physical_type; +mod schema; + +use std::collections::BTreeMap; +use std::sync::Arc; + +pub use field::Field; +pub use physical_type::*; +pub use schema::Schema; +#[cfg(feature = "serde_types")] +use serde_derive::{Deserialize, Serialize}; + +/// typedef for [BTreeMap] denoting [`Field`]'s and [`Schema`]'s metadata. +pub type Metadata = BTreeMap; +/// typedef for [Option<(String, Option)>] descr +pub(crate) type Extension = Option<(String, Option)>; + +/// The set of supported logical types in this crate. +/// +/// Each variant uniquely identifies a logical type, which define specific semantics to the data +/// (e.g. how it should be represented). +/// Each variant has a corresponding [`PhysicalType`], obtained via [`DataType::to_physical_type`], +/// which declares the in-memory representation of data. +/// The [`DataType::Extension`] is special in that it augments a [`DataType`] with metadata to support custom types. +/// Use `to_logical_type` to desugar such type and return its corresponding logical type. +#[derive(Debug, Clone, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum DataType { + /// Null type + Null, + /// `true` and `false`. + Boolean, + /// An [`i8`] + Int8, + /// An [`i16`] + Int16, + /// An [`i32`] + Int32, + /// An [`i64`] + Int64, + /// An [`u8`] + UInt8, + /// An [`u16`] + UInt16, + /// An [`u32`] + UInt32, + /// An [`u64`] + UInt64, + /// An 16-bit float + Float16, + /// A [`f32`] + Float32, + /// A [`f64`] + Float64, + /// A [`i64`] representing a timestamp measured in [`TimeUnit`] with an optional timezone. + /// + /// Time is measured as a Unix epoch, counting the seconds from + /// 00:00:00.000 on 1 January 1970, excluding leap seconds, + /// as a 64-bit signed integer. + /// + /// The time zone is a string indicating the name of a time zone, one of: + /// + /// * As used in the Olson time zone database (the "tz database" or + /// "tzdata"), such as "America/New_York" + /// * An absolute time zone offset of the form +XX:XX or -XX:XX, such as +07:30 + /// When the timezone is not specified, the timestamp is considered to have no timezone + /// and is represented _as is_ + Timestamp(TimeUnit, Option), + /// An [`i32`] representing the elapsed time since UNIX epoch (1970-01-01) + /// in days. + Date32, + /// An [`i64`] representing the elapsed time since UNIX epoch (1970-01-01) + /// in milliseconds. Values are evenly divisible by 86400000. + Date64, + /// A 32-bit time representing the elapsed time since midnight in the unit of `TimeUnit`. + /// Only [`TimeUnit::Second`] and [`TimeUnit::Millisecond`] are supported on this variant. + Time32(TimeUnit), + /// A 64-bit time representing the elapsed time since midnight in the unit of `TimeUnit`. + /// Only [`TimeUnit::Microsecond`] and [`TimeUnit::Nanosecond`] are supported on this variant. + Time64(TimeUnit), + /// Measure of elapsed time. This elapsed time is a physical duration (i.e. 1s as defined in S.I.) + Duration(TimeUnit), + /// A "calendar" interval modeling elapsed time that takes into account calendar shifts. + /// For example an interval of 1 day may represent more than 24 hours. + Interval(IntervalUnit), + /// Opaque binary data of variable length whose offsets are represented as [`i32`]. + Binary, + /// Opaque binary data of fixed size. + /// Enum parameter specifies the number of bytes per value. + FixedSizeBinary(usize), + /// Opaque binary data of variable length whose offsets are represented as [`i64`]. 
+ LargeBinary, + /// A variable-length UTF-8 encoded string whose offsets are represented as [`i32`]. + Utf8, + /// A variable-length UTF-8 encoded string whose offsets are represented as [`i64`]. + LargeUtf8, + /// A list of some logical data type whose offsets are represented as [`i32`]. + List(Box), + /// A list of some logical data type with a fixed number of elements. + FixedSizeList(Box, usize), + /// A list of some logical data type whose offsets are represented as [`i64`]. + LargeList(Box), + /// A nested [`DataType`] with a given number of [`Field`]s. + Struct(Vec), + /// A nested datatype that can represent slots of differing types. + /// Third argument represents mode + Union(Vec, Option>, UnionMode), + /// A nested type that is represented as + /// + /// List> + /// + /// In this layout, the keys and values are each respectively contiguous. We do + /// not constrain the key and value types, so the application is responsible + /// for ensuring that the keys are hashable and unique. Whether the keys are sorted + /// may be set in the metadata for this field. + /// + /// In a field with Map type, the field has a child Struct field, which then + /// has two children: key type and the second the value type. The names of the + /// child fields may be respectively "entries", "key", and "value", but this is + /// not enforced. + /// + /// Map + /// ```text + /// - child[0] entries: Struct + /// - child[0] key: K + /// - child[1] value: V + /// ``` + /// Neither the "entries" field nor the "key" field may be nullable. + /// + /// The metadata is structured so that Arrow systems without special handling + /// for Map can make Map an alias for List. The "layout" attribute for the Map + /// field must have the same contents as a List. + Map(Box, bool), + /// A dictionary encoded array (`key_type`, `value_type`), where + /// each array element is an index of `key_type` into an + /// associated dictionary of `value_type`. + /// + /// Dictionary arrays are used to store columns of `value_type` + /// that contain many repeated values using less memory, but with + /// a higher CPU overhead for some operations. + /// + /// This type mostly used to represent low cardinality string + /// arrays or a limited set of primitive types as integers. + /// + /// The `bool` value indicates the `Dictionary` is sorted if set to `true`. + Dictionary(IntegerType, Box, bool), + /// Decimal value with precision and scale + /// precision is the number of digits in the number and + /// scale is the number of decimal places. + /// The number 999.99 has a precision of 5 and scale of 2. + Decimal(usize, usize), + /// Decimal backed by 256 bits + Decimal256(usize, usize), + /// Extension type. 
+ Extension(String, Box, Option), +} + +#[cfg(feature = "arrow")] +impl From for arrow_schema::DataType { + fn from(value: DataType) -> Self { + use arrow_schema::{Field as ArrowField, UnionFields}; + + match value { + DataType::Null => Self::Null, + DataType::Boolean => Self::Boolean, + DataType::Int8 => Self::Int8, + DataType::Int16 => Self::Int16, + DataType::Int32 => Self::Int32, + DataType::Int64 => Self::Int64, + DataType::UInt8 => Self::UInt8, + DataType::UInt16 => Self::UInt16, + DataType::UInt32 => Self::UInt32, + DataType::UInt64 => Self::UInt64, + DataType::Float16 => Self::Float16, + DataType::Float32 => Self::Float32, + DataType::Float64 => Self::Float64, + DataType::Timestamp(unit, tz) => Self::Timestamp(unit.into(), tz.map(Into::into)), + DataType::Date32 => Self::Date32, + DataType::Date64 => Self::Date64, + DataType::Time32(unit) => Self::Time32(unit.into()), + DataType::Time64(unit) => Self::Time64(unit.into()), + DataType::Duration(unit) => Self::Duration(unit.into()), + DataType::Interval(unit) => Self::Interval(unit.into()), + DataType::Binary => Self::Binary, + DataType::FixedSizeBinary(size) => Self::FixedSizeBinary(size as _), + DataType::LargeBinary => Self::LargeBinary, + DataType::Utf8 => Self::Utf8, + DataType::LargeUtf8 => Self::LargeUtf8, + DataType::List(f) => Self::List(Arc::new((*f).into())), + DataType::FixedSizeList(f, size) => { + Self::FixedSizeList(Arc::new((*f).into()), size as _) + }, + DataType::LargeList(f) => Self::LargeList(Arc::new((*f).into())), + DataType::Struct(f) => Self::Struct(f.into_iter().map(ArrowField::from).collect()), + DataType::Union(fields, Some(ids), mode) => { + let ids = ids.into_iter().map(|x| x as _); + let fields = fields.into_iter().map(ArrowField::from); + Self::Union(UnionFields::new(ids, fields), mode.into()) + }, + DataType::Union(fields, None, mode) => { + let ids = 0..fields.len() as i8; + let fields = fields.into_iter().map(ArrowField::from); + Self::Union(UnionFields::new(ids, fields), mode.into()) + }, + DataType::Map(f, ordered) => Self::Map(Arc::new((*f).into()), ordered), + DataType::Dictionary(key, value, _) => Self::Dictionary( + Box::new(DataType::from(key).into()), + Box::new((*value).into()), + ), + DataType::Decimal(precision, scale) => Self::Decimal128(precision as _, scale as _), + DataType::Decimal256(precision, scale) => Self::Decimal256(precision as _, scale as _), + DataType::Extension(_, d, _) => (*d).into(), + } + } +} + +#[cfg(feature = "arrow")] +impl From for DataType { + fn from(value: arrow_schema::DataType) -> Self { + use arrow_schema::DataType; + match value { + DataType::Null => Self::Null, + DataType::Boolean => Self::Boolean, + DataType::Int8 => Self::Int8, + DataType::Int16 => Self::Int16, + DataType::Int32 => Self::Int32, + DataType::Int64 => Self::Int64, + DataType::UInt8 => Self::UInt8, + DataType::UInt16 => Self::UInt16, + DataType::UInt32 => Self::UInt32, + DataType::UInt64 => Self::UInt64, + DataType::Float16 => Self::Float16, + DataType::Float32 => Self::Float32, + DataType::Float64 => Self::Float64, + DataType::Timestamp(unit, tz) => { + Self::Timestamp(unit.into(), tz.map(|x| x.to_string())) + }, + DataType::Date32 => Self::Date32, + DataType::Date64 => Self::Date64, + DataType::Time32(unit) => Self::Time32(unit.into()), + DataType::Time64(unit) => Self::Time64(unit.into()), + DataType::Duration(unit) => Self::Duration(unit.into()), + DataType::Interval(unit) => Self::Interval(unit.into()), + DataType::Binary => Self::Binary, + DataType::FixedSizeBinary(size) => 
Self::FixedSizeBinary(size as _), + DataType::LargeBinary => Self::LargeBinary, + DataType::Utf8 => Self::Utf8, + DataType::LargeUtf8 => Self::LargeUtf8, + DataType::List(f) => Self::List(Box::new(f.into())), + DataType::FixedSizeList(f, size) => Self::FixedSizeList(Box::new(f.into()), size as _), + DataType::LargeList(f) => Self::LargeList(Box::new(f.into())), + DataType::Struct(f) => Self::Struct(f.into_iter().map(Into::into).collect()), + DataType::Union(fields, mode) => { + let ids = fields.iter().map(|(x, _)| x as _).collect(); + let fields = fields.iter().map(|(_, f)| f.into()).collect(); + Self::Union(fields, Some(ids), mode.into()) + }, + DataType::Map(f, ordered) => Self::Map(Box::new(f.into()), ordered), + DataType::Dictionary(key, value) => { + let key = match *key { + DataType::Int8 => IntegerType::Int8, + DataType::Int16 => IntegerType::Int16, + DataType::Int32 => IntegerType::Int32, + DataType::Int64 => IntegerType::Int64, + DataType::UInt8 => IntegerType::UInt8, + DataType::UInt16 => IntegerType::UInt16, + DataType::UInt32 => IntegerType::UInt32, + DataType::UInt64 => IntegerType::UInt64, + d => panic!("illegal dictionary key type: {d}"), + }; + Self::Dictionary(key, Box::new((*value).into()), false) + }, + DataType::Decimal128(precision, scale) => Self::Decimal(precision as _, scale as _), + DataType::Decimal256(precision, scale) => Self::Decimal256(precision as _, scale as _), + DataType::RunEndEncoded(_, _) => panic!("Run-end encoding not supported by arrow2"), + } + } +} + +/// Mode of [`DataType::Union`] +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum UnionMode { + /// Dense union + Dense, + /// Sparse union + Sparse, +} + +#[cfg(feature = "arrow")] +impl From for arrow_schema::UnionMode { + fn from(value: UnionMode) -> Self { + match value { + UnionMode::Dense => Self::Dense, + UnionMode::Sparse => Self::Sparse, + } + } +} + +#[cfg(feature = "arrow")] +impl From for UnionMode { + fn from(value: arrow_schema::UnionMode) -> Self { + match value { + arrow_schema::UnionMode::Dense => Self::Dense, + arrow_schema::UnionMode::Sparse => Self::Sparse, + } + } +} + +impl UnionMode { + /// Constructs a [`UnionMode::Sparse`] if the input bool is true, + /// or otherwise constructs a [`UnionMode::Dense`] + pub fn sparse(is_sparse: bool) -> Self { + if is_sparse { + Self::Sparse + } else { + Self::Dense + } + } + + /// Returns whether the mode is sparse + pub fn is_sparse(&self) -> bool { + matches!(self, Self::Sparse) + } + + /// Returns whether the mode is dense + pub fn is_dense(&self) -> bool { + matches!(self, Self::Dense) + } +} + +/// The time units defined in Arrow. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum TimeUnit { + /// Time in seconds. + Second, + /// Time in milliseconds. + Millisecond, + /// Time in microseconds. + Microsecond, + /// Time in nanoseconds. 
+    Nanosecond,
+}
+
+#[cfg(feature = "arrow")]
+impl From<TimeUnit> for arrow_schema::TimeUnit {
+    fn from(value: TimeUnit) -> Self {
+        match value {
+            TimeUnit::Nanosecond => Self::Nanosecond,
+            TimeUnit::Millisecond => Self::Millisecond,
+            TimeUnit::Microsecond => Self::Microsecond,
+            TimeUnit::Second => Self::Second,
+        }
+    }
+}
+
+#[cfg(feature = "arrow")]
+impl From<arrow_schema::TimeUnit> for TimeUnit {
+    fn from(value: arrow_schema::TimeUnit) -> Self {
+        match value {
+            arrow_schema::TimeUnit::Nanosecond => Self::Nanosecond,
+            arrow_schema::TimeUnit::Millisecond => Self::Millisecond,
+            arrow_schema::TimeUnit::Microsecond => Self::Microsecond,
+            arrow_schema::TimeUnit::Second => Self::Second,
+        }
+    }
+}
+
+/// Interval units defined in Arrow
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))]
+pub enum IntervalUnit {
+    /// The number of elapsed whole months.
+    YearMonth,
+    /// The number of elapsed days and milliseconds,
+    /// stored as 2 contiguous `i32`
+    DayTime,
+    /// The number of elapsed months (i32), days (i32) and nanoseconds (i64).
+    MonthDayNano,
+}
+
+#[cfg(feature = "arrow")]
+impl From<IntervalUnit> for arrow_schema::IntervalUnit {
+    fn from(value: IntervalUnit) -> Self {
+        match value {
+            IntervalUnit::YearMonth => Self::YearMonth,
+            IntervalUnit::DayTime => Self::DayTime,
+            IntervalUnit::MonthDayNano => Self::MonthDayNano,
+        }
+    }
+}
+
+#[cfg(feature = "arrow")]
+impl From<arrow_schema::IntervalUnit> for IntervalUnit {
+    fn from(value: arrow_schema::IntervalUnit) -> Self {
+        match value {
+            arrow_schema::IntervalUnit::YearMonth => Self::YearMonth,
+            arrow_schema::IntervalUnit::DayTime => Self::DayTime,
+            arrow_schema::IntervalUnit::MonthDayNano => Self::MonthDayNano,
+        }
+    }
+}
+
+impl DataType {
+    /// the [`PhysicalType`] of this [`DataType`].
+ pub fn to_physical_type(&self) -> PhysicalType { + use DataType::*; + match self { + Null => PhysicalType::Null, + Boolean => PhysicalType::Boolean, + Int8 => PhysicalType::Primitive(PrimitiveType::Int8), + Int16 => PhysicalType::Primitive(PrimitiveType::Int16), + Int32 | Date32 | Time32(_) | Interval(IntervalUnit::YearMonth) => { + PhysicalType::Primitive(PrimitiveType::Int32) + }, + Int64 | Date64 | Timestamp(_, _) | Time64(_) | Duration(_) => { + PhysicalType::Primitive(PrimitiveType::Int64) + }, + Decimal(_, _) => PhysicalType::Primitive(PrimitiveType::Int128), + Decimal256(_, _) => PhysicalType::Primitive(PrimitiveType::Int256), + UInt8 => PhysicalType::Primitive(PrimitiveType::UInt8), + UInt16 => PhysicalType::Primitive(PrimitiveType::UInt16), + UInt32 => PhysicalType::Primitive(PrimitiveType::UInt32), + UInt64 => PhysicalType::Primitive(PrimitiveType::UInt64), + Float16 => PhysicalType::Primitive(PrimitiveType::Float16), + Float32 => PhysicalType::Primitive(PrimitiveType::Float32), + Float64 => PhysicalType::Primitive(PrimitiveType::Float64), + Interval(IntervalUnit::DayTime) => PhysicalType::Primitive(PrimitiveType::DaysMs), + Interval(IntervalUnit::MonthDayNano) => { + PhysicalType::Primitive(PrimitiveType::MonthDayNano) + }, + Binary => PhysicalType::Binary, + FixedSizeBinary(_) => PhysicalType::FixedSizeBinary, + LargeBinary => PhysicalType::LargeBinary, + Utf8 => PhysicalType::Utf8, + LargeUtf8 => PhysicalType::LargeUtf8, + List(_) => PhysicalType::List, + FixedSizeList(_, _) => PhysicalType::FixedSizeList, + LargeList(_) => PhysicalType::LargeList, + Struct(_) => PhysicalType::Struct, + Union(_, _, _) => PhysicalType::Union, + Map(_, _) => PhysicalType::Map, + Dictionary(key, _, _) => PhysicalType::Dictionary(*key), + Extension(_, key, _) => key.to_physical_type(), + } + } + + /// Returns `&self` for all but [`DataType::Extension`]. For [`DataType::Extension`], + /// (recursively) returns the inner [`DataType`]. + /// Never returns the variant [`DataType::Extension`]. + pub fn to_logical_type(&self) -> &DataType { + use DataType::*; + match self { + Extension(_, key, _) => key.to_logical_type(), + _ => self, + } + } +} + +impl From for DataType { + fn from(item: IntegerType) -> Self { + match item { + IntegerType::Int8 => DataType::Int8, + IntegerType::Int16 => DataType::Int16, + IntegerType::Int32 => DataType::Int32, + IntegerType::Int64 => DataType::Int64, + IntegerType::UInt8 => DataType::UInt8, + IntegerType::UInt16 => DataType::UInt16, + IntegerType::UInt32 => DataType::UInt32, + IntegerType::UInt64 => DataType::UInt64, + } + } +} + +impl From for DataType { + fn from(item: PrimitiveType) -> Self { + match item { + PrimitiveType::Int8 => DataType::Int8, + PrimitiveType::Int16 => DataType::Int16, + PrimitiveType::Int32 => DataType::Int32, + PrimitiveType::Int64 => DataType::Int64, + PrimitiveType::UInt8 => DataType::UInt8, + PrimitiveType::UInt16 => DataType::UInt16, + PrimitiveType::UInt32 => DataType::UInt32, + PrimitiveType::UInt64 => DataType::UInt64, + PrimitiveType::Int128 => DataType::Decimal(32, 32), + PrimitiveType::Int256 => DataType::Decimal256(32, 32), + PrimitiveType::Float16 => DataType::Float16, + PrimitiveType::Float32 => DataType::Float32, + PrimitiveType::Float64 => DataType::Float64, + PrimitiveType::DaysMs => DataType::Interval(IntervalUnit::DayTime), + PrimitiveType::MonthDayNano => DataType::Interval(IntervalUnit::MonthDayNano), + } + } +} + +/// typedef for [`Arc`]. 
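To make the logical-to-physical mapping above concrete, a short sketch of how different logical types collapse onto the same physical representation, and how extension types are peeled off (`crate::` paths assumed):

```rust
// Sketch of `to_physical_type` / `to_logical_type` behaviour as defined above.
fn physical_type_examples() {
    use crate::datatypes::{DataType, PhysicalType, PrimitiveType, TimeUnit};

    // Date32 shares the Int32 physical representation.
    assert_eq!(
        DataType::Date32.to_physical_type(),
        PhysicalType::Primitive(PrimitiveType::Int32)
    );

    // Every timestamp unit is stored as Int64.
    assert_eq!(
        DataType::Timestamp(TimeUnit::Nanosecond, None).to_physical_type(),
        PhysicalType::Primitive(PrimitiveType::Int64)
    );

    // Extension types defer to their inner type for both views.
    let ext = DataType::Extension(
        "uuid".to_string(),
        Box::new(DataType::FixedSizeBinary(16)),
        None,
    );
    assert_eq!(ext.to_physical_type(), PhysicalType::FixedSizeBinary);
    assert_eq!(ext.to_logical_type(), &DataType::FixedSizeBinary(16));
}
```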
+pub type SchemaRef = Arc; + +/// support get extension for metadata +pub fn get_extension(metadata: &Metadata) -> Extension { + if let Some(name) = metadata.get("ARROW:extension:name") { + let metadata = metadata.get("ARROW:extension:metadata").cloned(); + Some((name.clone(), metadata)) + } else { + None + } +} diff --git a/crates/nano-arrow/src/datatypes/physical_type.rs b/crates/nano-arrow/src/datatypes/physical_type.rs new file mode 100644 index 000000000000..1e57fcf936bc --- /dev/null +++ b/crates/nano-arrow/src/datatypes/physical_type.rs @@ -0,0 +1,76 @@ +#[cfg(feature = "serde_types")] +use serde_derive::{Deserialize, Serialize}; + +pub use crate::types::PrimitiveType; + +/// The set of physical types: unique in-memory representations of an Arrow array. +/// A physical type has a one-to-many relationship with a [`crate::datatypes::DataType`] and +/// a one-to-one mapping to each struct in this crate that implements [`crate::array::Array`]. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum PhysicalType { + /// A Null with no allocation. + Null, + /// A boolean represented as a single bit. + Boolean, + /// An array where each slot has a known compile-time size. + Primitive(PrimitiveType), + /// Opaque binary data of variable length. + Binary, + /// Opaque binary data of fixed size. + FixedSizeBinary, + /// Opaque binary data of variable length and 64-bit offsets. + LargeBinary, + /// A variable-length string in Unicode with UTF-8 encoding. + Utf8, + /// A variable-length string in Unicode with UFT-8 encoding and 64-bit offsets. + LargeUtf8, + /// A list of some data type with variable length. + List, + /// A list of some data type with fixed length. + FixedSizeList, + /// A list of some data type with variable length and 64-bit offsets. + LargeList, + /// A nested type that contains an arbitrary number of fields. + Struct, + /// A nested type that represents slots of differing types. + Union, + /// A nested type. + Map, + /// A dictionary encoded array by `IntegerType`. + Dictionary(IntegerType), +} + +impl PhysicalType { + /// Whether this physical type equals [`PhysicalType::Primitive`] of type `primitive`. + pub fn eq_primitive(&self, primitive: PrimitiveType) -> bool { + if let Self::Primitive(o) = self { + o == &primitive + } else { + false + } + } +} + +/// the set of valid indices types of a dictionary-encoded Array. +/// Each type corresponds to a variant of [`crate::array::DictionaryArray`]. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum IntegerType { + /// A signed 8-bit integer. + Int8, + /// A signed 16-bit integer. + Int16, + /// A signed 32-bit integer. + Int32, + /// A signed 64-bit integer. + Int64, + /// An unsigned 8-bit integer. + UInt8, + /// An unsigned 16-bit integer. + UInt16, + /// An unsigned 32-bit integer. + UInt32, + /// An unsigned 64-bit integer. + UInt64, +} diff --git a/crates/nano-arrow/src/datatypes/schema.rs b/crates/nano-arrow/src/datatypes/schema.rs new file mode 100644 index 000000000000..d01f1937d2ed --- /dev/null +++ b/crates/nano-arrow/src/datatypes/schema.rs @@ -0,0 +1,60 @@ +#[cfg(feature = "serde_types")] +use serde_derive::{Deserialize, Serialize}; + +use super::{Field, Metadata}; + +/// An ordered sequence of [`Field`]s with associated [`Metadata`]. +/// +/// [`Schema`] is an abstraction used to read from, and write to, Arrow IPC format, +/// Apache Parquet, and Apache Avro. 
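The `get_extension` helper at the end of `datatypes/mod.rs` above reads the two well-known Arrow metadata keys. A minimal sketch of its behaviour, assuming `Metadata` is the `BTreeMap<String, String>` alias used elsewhere in this module:

```rust
// Sketch: extracting extension-type annotations from field metadata.
fn extension_from_metadata() {
    use crate::datatypes::{get_extension, Metadata};

    let mut metadata = Metadata::new();
    metadata.insert("ARROW:extension:name".to_string(), "uuid".to_string());
    metadata.insert("ARROW:extension:metadata".to_string(), "v1".to_string());

    assert_eq!(
        get_extension(&metadata),
        Some(("uuid".to_string(), Some("v1".to_string())))
    );

    // Without the name key there is no extension, even if other metadata exists.
    assert_eq!(get_extension(&Metadata::new()), None);
}
```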
All these formats have a concept of a schema +/// with fields and metadata. +#[derive(Debug, Clone, PartialEq, Eq, Default)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub struct Schema { + /// The fields composing this schema. + pub fields: Vec, + /// Optional metadata. + pub metadata: Metadata, +} + +impl Schema { + /// Attaches a [`Metadata`] to [`Schema`] + #[inline] + pub fn with_metadata(self, metadata: Metadata) -> Self { + Self { + fields: self.fields, + metadata, + } + } + + /// Returns a new [`Schema`] with a subset of all fields whose `predicate` + /// evaluates to true. + pub fn filter bool>(self, predicate: F) -> Self { + let fields = self + .fields + .into_iter() + .enumerate() + .filter_map(|(index, f)| { + if (predicate)(index, &f) { + Some(f) + } else { + None + } + }) + .collect(); + + Schema { + fields, + metadata: self.metadata, + } + } +} + +impl From> for Schema { + fn from(fields: Vec) -> Self { + Self { + fields, + ..Default::default() + } + } +} diff --git a/crates/nano-arrow/src/doc/lib.md b/crates/nano-arrow/src/doc/lib.md new file mode 100644 index 000000000000..a1b57945c020 --- /dev/null +++ b/crates/nano-arrow/src/doc/lib.md @@ -0,0 +1,87 @@ +Welcome to arrow2's documentation. Thanks for checking it out! + +This is a library for efficient in-memory data operations with +[Arrow in-memory format](https://arrow.apache.org/docs/format/Columnar.html). +It is a re-write from the bottom up of the official `arrow` crate with soundness +and type safety in mind. + +Check out [the guide](https://jorgecarleitao.github.io/arrow2/main/guide/) for an introduction. +Below is an example of some of the things you can do with it: + +```rust +use std::sync::Arc; + +use arrow2::array::*; +use arrow2::datatypes::{Field, DataType, Schema}; +use arrow2::compute::arithmetics; +use arrow2::error::Result; +use arrow2::io::parquet::write::*; +use arrow2::chunk::Chunk; + +fn main() -> Result<()> { + // declare arrays + let a = Int32Array::from(&[Some(1), None, Some(3)]); + let b = Int32Array::from(&[Some(2), None, Some(6)]); + + // compute (probably the fastest implementation of a nullable op you can find out there) + let c = arithmetics::basic::mul_scalar(&a, &2); + assert_eq!(c, b); + + // declare a schema with fields + let schema = Schema::from(vec![ + Field::new("c1", DataType::Int32, true), + Field::new("c2", DataType::Int32, true), + ]); + + // declare chunk + let chunk = Chunk::new(vec![a.arced(), b.arced()]); + + // write to parquet (probably the fastest implementation of writing to parquet out there) + + let options = WriteOptions { + write_statistics: true, + compression: CompressionOptions::Snappy, + version: Version::V1, + data_pagesize_limit: None, + }; + + let row_groups = RowGroupIterator::try_new( + vec![Ok(chunk)].into_iter(), + &schema, + options, + vec![vec![Encoding::Plain], vec![Encoding::Plain]], + )?; + + // anything implementing `std::io::Write` works + let mut file = vec![]; + + let mut writer = FileWriter::try_new(file, schema, options)?; + + // Write the file. + for group in row_groups { + writer.write(group?)?; + } + let _ = writer.end(None)?; + Ok(()) +} +``` + +## Cargo features + +This crate has a significant number of cargo features to reduce compilation +time and number of dependencies. 
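As a quick illustration of the `Schema` API from `datatypes/schema.rs` above, here is a sketch of composing `with_metadata` and `filter` (`crate::` paths and the `Metadata` alias are assumptions):

```rust
// Sketch of building, annotating, and filtering a Schema.
fn schema_example() {
    use crate::datatypes::{DataType, Field, Metadata, Schema};

    let schema = Schema::from(vec![
        Field::new("id", DataType::Int64, false),
        Field::new("name", DataType::LargeUtf8, true),
        Field::new("score", DataType::Float64, true),
    ])
    .with_metadata(Metadata::from([(
        "source".to_string(),
        "example".to_string(),
    )]));

    // Keep only the non-nullable fields; metadata is carried over unchanged.
    let filtered = schema.clone().filter(|_index, field| !field.is_nullable);
    assert_eq!(filtered.fields.len(), 1);
    assert_eq!(filtered.metadata, schema.metadata);
}
```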
The feature `"full"` activates most +functionality, such as: + +- `io_ipc`: to interact with the Arrow IPC format +- `io_ipc_compression`: to read and write compressed Arrow IPC (v2) +- `io_csv` to read and write CSV +- `io_json` to read and write JSON +- `io_flight` to read and write to Arrow's Flight protocol +- `io_parquet` to read and write parquet +- `io_parquet_compression` to read and write compressed parquet +- `io_print` to write batches to formatted ASCII tables +- `compute` to operate on arrays (addition, sum, sort, etc.) + +The feature `simd` (not part of `full`) produces more explicit SIMD instructions +via [`std::simd`](https://doc.rust-lang.org/nightly/std/simd/index.html), but requires the +nightly channel. diff --git a/crates/nano-arrow/src/error.rs b/crates/nano-arrow/src/error.rs new file mode 100644 index 000000000000..e6455d6f055d --- /dev/null +++ b/crates/nano-arrow/src/error.rs @@ -0,0 +1,100 @@ +//! Defines [`Error`], representing all errors returned by this crate. +use std::fmt::{Debug, Display, Formatter}; + +/// Enum with all errors in this crate. +#[derive(Debug)] +#[non_exhaustive] +pub enum Error { + /// Returned when functionality is not yet available. + NotYetImplemented(String), + /// Wrapper for an error triggered by a dependency + External(String, Box), + /// Wrapper for IO errors + Io(std::io::Error), + /// When an invalid argument is passed to a function. + InvalidArgumentError(String), + /// Error during import or export to/from a format + ExternalFormat(String), + /// Whenever pushing to a container fails because it does not support more entries. + /// The solution is usually to use a higher-capacity container-backing type. + Overflow, + /// Whenever incoming data from the C data interface, IPC or Flight does not fulfil the Arrow specification. + OutOfSpec(String), +} + +impl Error { + /// Wraps an external error in an `Error`. 
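A minimal sketch of how these error variants are typically produced and matched by callers (function names are illustrative, not part of the crate):

```rust
// Producing an error from a fallible parse and inspecting variants downstream.
fn parse_size(raw: &str) -> crate::error::Result<usize> {
    use crate::error::Error;

    raw.parse::<usize>()
        .map_err(|_| Error::InvalidArgumentError(format!("not a valid size: {raw}")))
}

fn describe(err: &crate::error::Error) -> &'static str {
    use crate::error::Error;

    match err {
        Error::Io(_) => "I/O failure",
        Error::OutOfSpec(_) => "data violates the Arrow specification",
        Error::Overflow => "a container ran out of capacity",
        // The enum is #[non_exhaustive], so a catch-all arm is required.
        _ => "other error",
    }
}
```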
+ pub fn from_external_error(error: impl std::error::Error + Send + Sync + 'static) -> Self { + Self::External("".to_string(), Box::new(error)) + } + + pub(crate) fn oos>(msg: A) -> Self { + Self::OutOfSpec(msg.into()) + } + + #[allow(dead_code)] + pub(crate) fn nyi>(msg: A) -> Self { + Self::NotYetImplemented(msg.into()) + } +} + +impl From<::std::io::Error> for Error { + fn from(error: std::io::Error) -> Self { + Error::Io(error) + } +} + +impl From for Error { + fn from(error: std::str::Utf8Error) -> Self { + Error::External("".to_string(), Box::new(error)) + } +} + +impl From for Error { + fn from(error: std::string::FromUtf8Error) -> Self { + Error::External("".to_string(), Box::new(error)) + } +} + +impl From for Error { + fn from(error: simdutf8::basic::Utf8Error) -> Self { + Error::External("".to_string(), Box::new(error)) + } +} + +impl From for Error { + fn from(_: std::collections::TryReserveError) -> Error { + Error::Overflow + } +} + +impl Display for Error { + fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result { + match self { + Error::NotYetImplemented(source) => { + write!(f, "Not yet implemented: {}", &source) + }, + Error::External(message, source) => { + write!(f, "External error{}: {}", message, &source) + }, + Error::Io(desc) => write!(f, "Io error: {desc}"), + Error::InvalidArgumentError(desc) => { + write!(f, "Invalid argument error: {desc}") + }, + Error::ExternalFormat(desc) => { + write!(f, "External format error: {desc}") + }, + Error::Overflow => { + write!(f, "Operation overflew the backing container.") + }, + Error::OutOfSpec(message) => { + write!(f, "{message}") + }, + } + } +} + +impl std::error::Error for Error {} + +/// Typedef for a [`std::result::Result`] of an [`Error`]. +pub type Result = std::result::Result; diff --git a/crates/nano-arrow/src/ffi/array.rs b/crates/nano-arrow/src/ffi/array.rs new file mode 100644 index 000000000000..f87f7e66a10c --- /dev/null +++ b/crates/nano-arrow/src/ffi/array.rs @@ -0,0 +1,568 @@ +//! Contains functionality to load an ArrayData from the C Data Interface +use std::sync::Arc; + +use super::ArrowArray; +use crate::array::*; +use crate::bitmap::utils::{bytes_for, count_zeros}; +use crate::bitmap::Bitmap; +use crate::buffer::{Buffer, Bytes, BytesAllocator}; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::{Error, Result}; +use crate::ffi::schema::get_child; +use crate::types::NativeType; + +/// Reads a valid `ffi` interface into a `Box` +/// # Errors +/// If and only if: +/// * the interface is not valid (e.g. a null pointer) +pub unsafe fn try_from(array: A) -> Result> { + use PhysicalType::*; + Ok(match array.data_type().to_physical_type() { + Null => Box::new(NullArray::try_from_ffi(array)?), + Boolean => Box::new(BooleanArray::try_from_ffi(array)?), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(PrimitiveArray::<$T>::try_from_ffi(array)?) 
+ }), + Utf8 => Box::new(Utf8Array::::try_from_ffi(array)?), + LargeUtf8 => Box::new(Utf8Array::::try_from_ffi(array)?), + Binary => Box::new(BinaryArray::::try_from_ffi(array)?), + LargeBinary => Box::new(BinaryArray::::try_from_ffi(array)?), + FixedSizeBinary => Box::new(FixedSizeBinaryArray::try_from_ffi(array)?), + List => Box::new(ListArray::::try_from_ffi(array)?), + LargeList => Box::new(ListArray::::try_from_ffi(array)?), + FixedSizeList => Box::new(FixedSizeListArray::try_from_ffi(array)?), + Struct => Box::new(StructArray::try_from_ffi(array)?), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + Box::new(DictionaryArray::<$T>::try_from_ffi(array)?) + }) + }, + Union => Box::new(UnionArray::try_from_ffi(array)?), + Map => Box::new(MapArray::try_from_ffi(array)?), + }) +} + +// Sound because the arrow specification does not allow multiple implementations +// to change this struct +// This is intrinsically impossible to prove because the implementations agree +// on this as part of the Arrow specification +unsafe impl Send for ArrowArray {} +unsafe impl Sync for ArrowArray {} + +impl Drop for ArrowArray { + fn drop(&mut self) { + match self.release { + None => (), + Some(release) => unsafe { release(self) }, + }; + } +} + +// callback used to drop [ArrowArray] when it is exported +unsafe extern "C" fn c_release_array(array: *mut ArrowArray) { + if array.is_null() { + return; + } + let array = &mut *array; + + // take ownership of `private_data`, therefore dropping it + let private = Box::from_raw(array.private_data as *mut PrivateData); + for child in private.children_ptr.iter() { + let _ = Box::from_raw(*child); + } + + if let Some(ptr) = private.dictionary_ptr { + let _ = Box::from_raw(ptr); + } + + array.release = None; +} + +#[allow(dead_code)] +struct PrivateData { + array: Box, + buffers_ptr: Box<[*const std::os::raw::c_void]>, + children_ptr: Box<[*mut ArrowArray]>, + dictionary_ptr: Option<*mut ArrowArray>, +} + +impl ArrowArray { + /// creates a new `ArrowArray` from existing data. + /// # Safety + /// This method releases `buffers`. Consumers of this struct *must* call `release` before + /// releasing this struct, or contents in `buffers` leak. 
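`try_from` returns a type-erased `Box<dyn Array>`; a downstream caller usually dispatches on the physical type and downcasts, mirroring the match above. A sketch (paths assumed):

```rust
// Downcast an imported array when its physical type is Int64 and sum the
// non-null values; returns None for any other physical type.
fn sum_if_int64(array: &dyn crate::array::Array) -> Option<i64> {
    use crate::array::PrimitiveArray;
    use crate::datatypes::{PhysicalType, PrimitiveType};

    if array.data_type().to_physical_type() == PhysicalType::Primitive(PrimitiveType::Int64) {
        let typed = array.as_any().downcast_ref::<PrimitiveArray<i64>>()?;
        Some(typed.iter().flatten().copied().sum())
    } else {
        None
    }
}
```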
+ pub(crate) fn new(array: Box) -> Self { + let (offset, buffers, children, dictionary) = + offset_buffers_children_dictionary(array.as_ref()); + + let buffers_ptr = buffers + .iter() + .map(|maybe_buffer| match maybe_buffer { + Some(b) => *b as *const std::os::raw::c_void, + None => std::ptr::null(), + }) + .collect::>(); + let n_buffers = buffers.len() as i64; + + let children_ptr = children + .into_iter() + .map(|child| Box::into_raw(Box::new(ArrowArray::new(child)))) + .collect::>(); + let n_children = children_ptr.len() as i64; + + let dictionary_ptr = + dictionary.map(|array| Box::into_raw(Box::new(ArrowArray::new(array)))); + + let length = array.len() as i64; + let null_count = array.null_count() as i64; + + let mut private_data = Box::new(PrivateData { + array, + buffers_ptr, + children_ptr, + dictionary_ptr, + }); + + Self { + length, + null_count, + offset: offset as i64, + n_buffers, + n_children, + buffers: private_data.buffers_ptr.as_mut_ptr(), + children: private_data.children_ptr.as_mut_ptr(), + dictionary: private_data.dictionary_ptr.unwrap_or(std::ptr::null_mut()), + release: Some(c_release_array), + private_data: Box::into_raw(private_data) as *mut ::std::os::raw::c_void, + } + } + + /// creates an empty [`ArrowArray`], which can be used to import data into + pub fn empty() -> Self { + Self { + length: 0, + null_count: 0, + offset: 0, + n_buffers: 0, + n_children: 0, + buffers: std::ptr::null_mut(), + children: std::ptr::null_mut(), + dictionary: std::ptr::null_mut(), + release: None, + private_data: std::ptr::null_mut(), + } + } + + /// the length of the array + pub(crate) fn len(&self) -> usize { + self.length as usize + } + + /// the offset of the array + pub(crate) fn offset(&self) -> usize { + self.offset as usize + } + + /// the null count of the array + pub(crate) fn null_count(&self) -> usize { + self.null_count as usize + } +} + +/// # Safety +/// The caller must ensure that the buffer at index `i` is not mutably shared. +unsafe fn get_buffer_ptr( + array: &ArrowArray, + data_type: &DataType, + index: usize, +) -> Result<*mut T> { + if array.buffers.is_null() { + return Err(Error::oos(format!( + "An ArrowArray of type {data_type:?} must have non-null buffers" + ))); + } + + if array + .buffers + .align_offset(std::mem::align_of::<*mut *const u8>()) + != 0 + { + return Err(Error::oos(format!( + "An ArrowArray of type {data_type:?} + must have buffer {index} aligned to type {}", + std::any::type_name::<*mut *const u8>() + ))); + } + let buffers = array.buffers as *mut *const u8; + + if index >= array.n_buffers as usize { + return Err(Error::oos(format!( + "An ArrowArray of type {data_type:?} + must have buffer {index}." + ))); + } + + let ptr = *buffers.add(index); + if ptr.is_null() { + return Err(Error::oos(format!( + "An array of type {data_type:?} + must have a non-null buffer {index}" + ))); + } + + // note: we can't prove that this pointer is not mutably shared - part of the safety invariant + Ok(ptr as *mut T) +} + +/// returns the buffer `i` of `array` interpreted as a [`Buffer`]. 
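On the producer side, `ArrowArray::new` is normally reached through the public exporters defined later in `ffi/mod.rs` (see below). A hedged sketch of that flow:

```rust
// Producer-side sketch: export an array and its field over the C data interface
// with `export_array_to_c` / `export_field_to_c` from `ffi/mod.rs` further below.
fn export_example() -> (crate::ffi::ArrowArray, crate::ffi::ArrowSchema) {
    use crate::array::Int32Array;
    use crate::datatypes::{DataType, Field};
    use crate::ffi;

    let array = Int32Array::from(&[Some(1), None, Some(3)]);
    let field = Field::new("a", DataType::Int32, true);

    // Ownership of the buffers moves into the returned C structs; the consumer
    // calls their `release` callbacks (or Rust's `Drop` impls do, if unconsumed).
    (
        ffi::export_array_to_c(Box::new(array)),
        ffi::export_field_to_c(&field),
    )
}
```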
+/// # Safety +/// This function is safe iff: +/// * the buffers up to position `index` are valid for the declared length +/// * the buffers' pointers are not mutably shared for the lifetime of `owner` +unsafe fn create_buffer( + array: &ArrowArray, + data_type: &DataType, + owner: InternalArrowArray, + index: usize, +) -> Result> { + let len = buffer_len(array, data_type, index)?; + + if len == 0 { + return Ok(Buffer::new()); + } + + let offset = buffer_offset(array, data_type, index); + let ptr: *mut T = get_buffer_ptr(array, data_type, index)?; + + // We have to check alignment. + // This is the zero-copy path. + if ptr.align_offset(std::mem::align_of::()) == 0 { + let bytes = Bytes::from_foreign(ptr, len, BytesAllocator::InternalArrowArray(owner)); + Ok(Buffer::from_bytes(bytes).sliced(offset, len - offset)) + } + // This is the path where alignment isn't correct. + // We copy the data to a new vec + else { + let buf = std::slice::from_raw_parts(ptr, len - offset).to_vec(); + Ok(Buffer::from(buf)) + } +} + +/// returns the buffer `i` of `array` interpreted as a [`Bitmap`]. +/// # Safety +/// This function is safe iff: +/// * the buffer at position `index` is valid for the declared length +/// * the buffers' pointer is not mutable for the lifetime of `owner` +unsafe fn create_bitmap( + array: &ArrowArray, + data_type: &DataType, + owner: InternalArrowArray, + index: usize, + // if this is the validity bitmap + // we can use the null count directly + is_validity: bool, +) -> Result { + let len: usize = array.length.try_into().expect("length to fit in `usize`"); + if len == 0 { + return Ok(Bitmap::new()); + } + let ptr = get_buffer_ptr(array, data_type, index)?; + + // Pointer of u8 has alignment 1, so we don't have to check alignment. + + let offset: usize = array.offset.try_into().expect("offset to fit in `usize`"); + let bytes_len = bytes_for(offset + len); + let bytes = Bytes::from_foreign(ptr, bytes_len, BytesAllocator::InternalArrowArray(owner)); + + let null_count: usize = if is_validity { + array.null_count() + } else { + count_zeros(bytes.as_ref(), offset, len) + }; + Bitmap::from_inner(Arc::new(bytes), offset, len, null_count) +} + +fn buffer_offset(array: &ArrowArray, data_type: &DataType, i: usize) -> usize { + use PhysicalType::*; + match (data_type.to_physical_type(), i) { + (LargeUtf8, 2) | (LargeBinary, 2) | (Utf8, 2) | (Binary, 2) => 0, + (FixedSizeBinary, 1) => { + if let DataType::FixedSizeBinary(size) = data_type.to_logical_type() { + let offset: usize = array.offset.try_into().expect("Offset to fit in `usize`"); + offset * *size + } else { + unreachable!() + } + }, + _ => array.offset.try_into().expect("Offset to fit in `usize`"), + } +} + +/// Returns the length, in slots, of the buffer `i` (indexed according to the C data interface) +unsafe fn buffer_len(array: &ArrowArray, data_type: &DataType, i: usize) -> Result { + Ok(match (data_type.to_physical_type(), i) { + (PhysicalType::FixedSizeBinary, 1) => { + if let DataType::FixedSizeBinary(size) = data_type.to_logical_type() { + *size * (array.offset as usize + array.length as usize) + } else { + unreachable!() + } + }, + (PhysicalType::FixedSizeList, 1) => { + if let DataType::FixedSizeList(_, size) = data_type.to_logical_type() { + *size * (array.offset as usize + array.length as usize) + } else { + unreachable!() + } + }, + (PhysicalType::Utf8, 1) + | (PhysicalType::LargeUtf8, 1) + | (PhysicalType::Binary, 1) + | (PhysicalType::LargeBinary, 1) + | (PhysicalType::List, 1) + | (PhysicalType::LargeList, 1) + | 
(PhysicalType::Map, 1) => { + // the len of the offset buffer (buffer 1) equals length + 1 + array.offset as usize + array.length as usize + 1 + }, + (PhysicalType::Utf8, 2) | (PhysicalType::Binary, 2) => { + // the len of the data buffer (buffer 2) equals the last value of the offset buffer (buffer 1) + let len = buffer_len(array, data_type, 1)?; + // first buffer is the null buffer => add(1) + let offset_buffer = unsafe { *(array.buffers as *mut *const u8).add(1) }; + // interpret as i32 + let offset_buffer = offset_buffer as *const i32; + // get last offset + + (unsafe { *offset_buffer.add(len - 1) }) as usize + }, + (PhysicalType::LargeUtf8, 2) | (PhysicalType::LargeBinary, 2) => { + // the len of the data buffer (buffer 2) equals the last value of the offset buffer (buffer 1) + let len = buffer_len(array, data_type, 1)?; + // first buffer is the null buffer => add(1) + let offset_buffer = unsafe { *(array.buffers as *mut *const u8).add(1) }; + // interpret as i64 + let offset_buffer = offset_buffer as *const i64; + // get last offset + (unsafe { *offset_buffer.add(len - 1) }) as usize + }, + // buffer len of primitive types + _ => array.offset as usize + array.length as usize, + }) +} + +/// Safety +/// This function is safe iff: +/// * `array.children` at `index` is valid +/// * `array.children` is not mutably shared for the lifetime of `parent` +/// * the pointer of `array.children` at `index` is valid +/// * the pointer of `array.children` at `index` is not mutably shared for the lifetime of `parent` +unsafe fn create_child( + array: &ArrowArray, + data_type: &DataType, + parent: InternalArrowArray, + index: usize, +) -> Result> { + let data_type = get_child(data_type, index)?; + + // catch what we can + if array.children.is_null() { + return Err(Error::oos(format!( + "An ArrowArray of type {data_type:?} must have non-null children" + ))); + } + + if index >= array.n_children as usize { + return Err(Error::oos(format!( + "An ArrowArray of type {data_type:?} + must have child {index}." + ))); + } + + // Safety - part of the invariant + let arr_ptr = unsafe { *array.children.add(index) }; + + // catch what we can + if arr_ptr.is_null() { + return Err(Error::oos(format!( + "An array of type {data_type:?} + must have a non-null child {index}" + ))); + } + + // Safety - invariant of this function + let arr_ptr = unsafe { &*arr_ptr }; + Ok(ArrowArrayChild::new(arr_ptr, data_type, parent)) +} + +/// Safety +/// This function is safe iff: +/// * `array.dictionary` is valid +/// * `array.dictionary` is not mutably shared for the lifetime of `parent` +unsafe fn create_dictionary( + array: &ArrowArray, + data_type: &DataType, + parent: InternalArrowArray, +) -> Result>> { + if let DataType::Dictionary(_, values, _) = data_type { + let data_type = values.as_ref().clone(); + // catch what we can + if array.dictionary.is_null() { + return Err(Error::oos(format!( + "An array of type {data_type:?} + must have a non-null dictionary" + ))); + } + + // safety: part of the invariant + let array = unsafe { &*array.dictionary }; + Ok(Some(ArrowArrayChild::new(array, data_type, parent))) + } else { + Ok(None) + } +} + +pub trait ArrowArrayRef: std::fmt::Debug { + fn owner(&self) -> InternalArrowArray { + (*self.parent()).clone() + } + + /// returns the null bit buffer. + /// Rust implementation uses a buffer that is not part of the array of buffers. + /// The C Data interface's null buffer is part of the array of buffers. 
+ /// # Safety + /// The caller must guarantee that the buffer `index` corresponds to a bitmap. + /// This function assumes that the bitmap created from FFI is valid; this is impossible to prove. + unsafe fn validity(&self) -> Result> { + if self.array().null_count() == 0 { + Ok(None) + } else { + create_bitmap(self.array(), self.data_type(), self.owner(), 0, true).map(Some) + } + } + + /// # Safety + /// The caller must guarantee that the buffer `index` corresponds to a buffer. + /// This function assumes that the buffer created from FFI is valid; this is impossible to prove. + unsafe fn buffer(&self, index: usize) -> Result> { + create_buffer::(self.array(), self.data_type(), self.owner(), index) + } + + /// # Safety + /// This function is safe iff: + /// * the buffer at position `index` is valid for the declared length + /// * the buffers' pointer is not mutable for the lifetime of `owner` + unsafe fn bitmap(&self, index: usize) -> Result { + create_bitmap(self.array(), self.data_type(), self.owner(), index, false) + } + + /// # Safety + /// * `array.children` at `index` is valid + /// * `array.children` is not mutably shared for the lifetime of `parent` + /// * the pointer of `array.children` at `index` is valid + /// * the pointer of `array.children` at `index` is not mutably shared for the lifetime of `parent` + unsafe fn child(&self, index: usize) -> Result { + create_child(self.array(), self.data_type(), self.parent().clone(), index) + } + + unsafe fn dictionary(&self) -> Result> { + create_dictionary(self.array(), self.data_type(), self.parent().clone()) + } + + fn n_buffers(&self) -> usize; + + fn parent(&self) -> &InternalArrowArray; + fn array(&self) -> &ArrowArray; + fn data_type(&self) -> &DataType; +} + +/// Struct used to move an Array from and to the C Data Interface. +/// Its main responsibility is to expose functionality that requires +/// both [ArrowArray] and [ArrowSchema]. +/// +/// This struct has two main paths: +/// +/// ## Import from the C Data Interface +/// * [InternalArrowArray::empty] to allocate memory to be filled by an external call +/// * [InternalArrowArray::try_from_raw] to consume two non-null allocated pointers +/// ## Export to the C Data Interface +/// * [InternalArrowArray::try_new] to create a new [InternalArrowArray] from Rust-specific information +/// * [InternalArrowArray::into_raw] to expose two pointers for [ArrowArray] and [ArrowSchema]. +/// +/// # Safety +/// Whoever creates this struct is responsible for releasing their resources. Specifically, +/// consumers *must* call [InternalArrowArray::into_raw] and take ownership of the individual pointers, +/// calling [ArrowArray::release] and [ArrowSchema::release] accordingly. +/// +/// Furthermore, this struct assumes that the incoming data agrees with the C data interface. 
+#[derive(Debug, Clone)] +pub struct InternalArrowArray { + // Arc is used for sharability since this is immutable + array: Arc, + // Arced to reduce cost of cloning + data_type: Arc, +} + +impl InternalArrowArray { + pub fn new(array: ArrowArray, data_type: DataType) -> Self { + Self { + array: Arc::new(array), + data_type: Arc::new(data_type), + } + } +} + +impl ArrowArrayRef for InternalArrowArray { + /// the data_type as declared in the schema + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn parent(&self) -> &InternalArrowArray { + self + } + + fn array(&self) -> &ArrowArray { + self.array.as_ref() + } + + fn n_buffers(&self) -> usize { + self.array.n_buffers as usize + } +} + +#[derive(Debug)] +pub struct ArrowArrayChild<'a> { + array: &'a ArrowArray, + data_type: DataType, + parent: InternalArrowArray, +} + +impl<'a> ArrowArrayRef for ArrowArrayChild<'a> { + /// the data_type as declared in the schema + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn parent(&self) -> &InternalArrowArray { + &self.parent + } + + fn array(&self) -> &ArrowArray { + self.array + } + + fn n_buffers(&self) -> usize { + self.array.n_buffers as usize + } +} + +impl<'a> ArrowArrayChild<'a> { + fn new(array: &'a ArrowArray, data_type: DataType, parent: InternalArrowArray) -> Self { + Self { + array, + data_type, + parent, + } + } +} diff --git a/crates/nano-arrow/src/ffi/bridge.rs b/crates/nano-arrow/src/ffi/bridge.rs new file mode 100644 index 000000000000..7a7b9a86ca3a --- /dev/null +++ b/crates/nano-arrow/src/ffi/bridge.rs @@ -0,0 +1,39 @@ +use crate::array::*; + +macro_rules! ffi_dyn { + ($array:expr, $ty:ty) => {{ + let a = $array.as_any().downcast_ref::<$ty>().unwrap(); + if a.offset().is_some() { + $array + } else { + Box::new(a.to_ffi_aligned()) + } + }}; +} + +pub fn align_to_c_data_interface(array: Box) -> Box { + use crate::datatypes::PhysicalType::*; + match array.data_type().to_physical_type() { + Null => ffi_dyn!(array, NullArray), + Boolean => ffi_dyn!(array, BooleanArray), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + ffi_dyn!(array, PrimitiveArray<$T>) + }), + Binary => ffi_dyn!(array, BinaryArray), + LargeBinary => ffi_dyn!(array, BinaryArray), + FixedSizeBinary => ffi_dyn!(array, FixedSizeBinaryArray), + Utf8 => ffi_dyn!(array, Utf8Array::), + LargeUtf8 => ffi_dyn!(array, Utf8Array::), + List => ffi_dyn!(array, ListArray::), + LargeList => ffi_dyn!(array, ListArray::), + FixedSizeList => ffi_dyn!(array, FixedSizeListArray), + Struct => ffi_dyn!(array, StructArray), + Union => ffi_dyn!(array, UnionArray), + Map => ffi_dyn!(array, MapArray), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + ffi_dyn!(array, DictionaryArray<$T>) + }) + }, + } +} diff --git a/crates/nano-arrow/src/ffi/generated.rs b/crates/nano-arrow/src/ffi/generated.rs new file mode 100644 index 000000000000..cd4953b7198a --- /dev/null +++ b/crates/nano-arrow/src/ffi/generated.rs @@ -0,0 +1,55 @@ +/* automatically generated by rust-bindgen 0.59.2 */ + +/// ABI-compatible struct for [`ArrowSchema`](https://arrow.apache.org/docs/format/CDataInterface.html#structure-definitions) +#[repr(C)] +#[derive(Debug)] +pub struct ArrowSchema { + pub(super) format: *const ::std::os::raw::c_char, + pub(super) name: *const ::std::os::raw::c_char, + pub(super) metadata: *const ::std::os::raw::c_char, + pub(super) flags: i64, + pub(super) n_children: i64, + pub(super) children: *mut *mut ArrowSchema, + pub(super) dictionary: *mut ArrowSchema, + pub(super) release: 
::std::option::Option, + pub(super) private_data: *mut ::std::os::raw::c_void, +} + +/// ABI-compatible struct for [`ArrowArray`](https://arrow.apache.org/docs/format/CDataInterface.html#structure-definitions) +#[repr(C)] +#[derive(Debug)] +pub struct ArrowArray { + pub(super) length: i64, + pub(super) null_count: i64, + pub(super) offset: i64, + pub(super) n_buffers: i64, + pub(super) n_children: i64, + pub(super) buffers: *mut *const ::std::os::raw::c_void, + pub(super) children: *mut *mut ArrowArray, + pub(super) dictionary: *mut ArrowArray, + pub(super) release: ::std::option::Option, + pub(super) private_data: *mut ::std::os::raw::c_void, +} + +/// ABI-compatible struct for [`ArrowArrayStream`](https://arrow.apache.org/docs/format/CStreamInterface.html). +#[repr(C)] +#[derive(Debug)] +pub struct ArrowArrayStream { + pub(super) get_schema: ::std::option::Option< + unsafe extern "C" fn( + arg1: *mut ArrowArrayStream, + out: *mut ArrowSchema, + ) -> ::std::os::raw::c_int, + >, + pub(super) get_next: ::std::option::Option< + unsafe extern "C" fn( + arg1: *mut ArrowArrayStream, + out: *mut ArrowArray, + ) -> ::std::os::raw::c_int, + >, + pub(super) get_last_error: ::std::option::Option< + unsafe extern "C" fn(arg1: *mut ArrowArrayStream) -> *const ::std::os::raw::c_char, + >, + pub(super) release: ::std::option::Option, + pub(super) private_data: *mut ::std::os::raw::c_void, +} diff --git a/crates/nano-arrow/src/ffi/mmap.rs b/crates/nano-arrow/src/ffi/mmap.rs new file mode 100644 index 000000000000..03c1ac9aa30a --- /dev/null +++ b/crates/nano-arrow/src/ffi/mmap.rs @@ -0,0 +1,164 @@ +//! Functionality to mmap in-memory data regions. +use std::sync::Arc; + +use super::{ArrowArray, InternalArrowArray}; +use crate::array::{BooleanArray, FromFfi, PrimitiveArray}; +use crate::datatypes::DataType; +use crate::error::Error; +use crate::types::NativeType; + +#[allow(dead_code)] +struct PrivateData { + // the owner of the pointers' regions + data: T, + buffers_ptr: Box<[*const std::os::raw::c_void]>, + children_ptr: Box<[*mut ArrowArray]>, + dictionary_ptr: Option<*mut ArrowArray>, +} + +pub(crate) unsafe fn create_array< + T: AsRef<[u8]>, + I: Iterator>, + II: Iterator, +>( + data: Arc, + num_rows: usize, + null_count: usize, + buffers: I, + children: II, + dictionary: Option, + offset: Option, +) -> ArrowArray { + let buffers_ptr = buffers + .map(|maybe_buffer| match maybe_buffer { + Some(b) => b as *const std::os::raw::c_void, + None => std::ptr::null(), + }) + .collect::>(); + let n_buffers = buffers_ptr.len() as i64; + + let children_ptr = children + .map(|child| Box::into_raw(Box::new(child))) + .collect::>(); + let n_children = children_ptr.len() as i64; + + let dictionary_ptr = dictionary.map(|array| Box::into_raw(Box::new(array))); + + let mut private_data = Box::new(PrivateData::> { + data, + buffers_ptr, + children_ptr, + dictionary_ptr, + }); + + ArrowArray { + length: num_rows as i64, + null_count: null_count as i64, + offset: offset.unwrap_or(0) as i64, // Unwrap: IPC files are by definition not offset + n_buffers, + n_children, + buffers: private_data.buffers_ptr.as_mut_ptr(), + children: private_data.children_ptr.as_mut_ptr(), + dictionary: private_data.dictionary_ptr.unwrap_or(std::ptr::null_mut()), + release: Some(release::>), + private_data: Box::into_raw(private_data) as *mut ::std::os::raw::c_void, + } +} + +/// callback used to drop [`ArrowArray`] when it is exported specified for [`PrivateData`]. 
+unsafe extern "C" fn release(array: *mut ArrowArray) { + if array.is_null() { + return; + } + let array = &mut *array; + + // take ownership of `private_data`, therefore dropping it + let private = Box::from_raw(array.private_data as *mut PrivateData); + for child in private.children_ptr.iter() { + let _ = Box::from_raw(*child); + } + + if let Some(ptr) = private.dictionary_ptr { + let _ = Box::from_raw(ptr); + } + + array.release = None; +} + +/// Creates a (non-null) [`PrimitiveArray`] from a slice of values. +/// This does not have memcopy and is the fastest way to create a [`PrimitiveArray`]. +/// +/// This can be useful if you want to apply arrow kernels on slices without incurring +/// a memcopy cost. +/// +/// # Safety +/// +/// Using this function is not unsafe, but the returned PrimitiveArray's lifetime is bound to the lifetime +/// of the slice. The returned [`PrimitiveArray`] _must not_ outlive the passed slice. +pub unsafe fn slice(slice: &[T]) -> PrimitiveArray { + let num_rows = slice.len(); + let null_count = 0; + let validity = None; + + let data: &[u8] = bytemuck::cast_slice(slice); + let ptr = data.as_ptr(); + let data = Arc::new(data); + + // safety: the underlying assumption of this function: the array will not be used + // beyond the + let array = create_array( + data, + num_rows, + null_count, + [validity, Some(ptr)].into_iter(), + [].into_iter(), + None, + None, + ); + let array = InternalArrowArray::new(array, T::PRIMITIVE.into()); + + // safety: we just created a valid array + unsafe { PrimitiveArray::::try_from_ffi(array) }.unwrap() +} + +/// Creates a (non-null) [`BooleanArray`] from a slice of bits. +/// This does not have memcopy and is the fastest way to create a [`BooleanArray`]. +/// +/// This can be useful if you want to apply arrow kernels on slices without incurring +/// a memcopy cost. +/// +/// The `offset` indicates where the first bit starts in the first byte. +/// +/// # Safety +/// +/// Using this function is not unsafe, but the returned BooleanArrays's lifetime is bound to the lifetime +/// of the slice. The returned [`BooleanArray`] _must not_ outlive the passed slice. +pub unsafe fn bitmap(data: &[u8], offset: usize, length: usize) -> Result { + if offset >= 8 { + return Err(Error::InvalidArgumentError("offset should be < 8".into())); + }; + if length > data.len() * 8 - offset { + return Err(Error::InvalidArgumentError("given length is oob".into())); + } + let null_count = 0; + let validity = None; + + let ptr = data.as_ptr(); + let data = Arc::new(data); + + // safety: the underlying assumption of this function: the array will not be used + // beyond the + let array = create_array( + data, + length, + null_count, + [validity, Some(ptr)].into_iter(), + [].into_iter(), + None, + Some(offset), + ); + let array = InternalArrowArray::new(array, DataType::Boolean); + + // safety: we just created a valid array + Ok(unsafe { BooleanArray::try_from_ffi(array) }.unwrap()) +} diff --git a/crates/nano-arrow/src/ffi/mod.rs b/crates/nano-arrow/src/ffi/mod.rs new file mode 100644 index 000000000000..b1a1ac3c1210 --- /dev/null +++ b/crates/nano-arrow/src/ffi/mod.rs @@ -0,0 +1,46 @@ +//! contains FFI bindings to import and export [`Array`](crate::array::Array) via +//! 
Arrow's [C Data Interface](https://arrow.apache.org/docs/format/CDataInterface.html) +mod array; +mod bridge; +mod generated; +pub mod mmap; +mod schema; +mod stream; + +pub(crate) use array::{try_from, ArrowArrayRef, InternalArrowArray}; +pub use generated::{ArrowArray, ArrowArrayStream, ArrowSchema}; +pub use stream::{export_iterator, ArrowArrayStreamReader}; + +use self::schema::to_field; +use crate::array::Array; +use crate::datatypes::{DataType, Field}; +use crate::error::Result; + +/// Exports an [`Box`] to the C data interface. +pub fn export_array_to_c(array: Box) -> ArrowArray { + ArrowArray::new(bridge::align_to_c_data_interface(array)) +} + +/// Exports a [`Field`] to the C data interface. +pub fn export_field_to_c(field: &Field) -> ArrowSchema { + ArrowSchema::new(field) +} + +/// Imports a [`Field`] from the C data interface. +/// # Safety +/// This function is intrinsically `unsafe` and relies on a [`ArrowSchema`] +/// being valid according to the [C data interface](https://arrow.apache.org/docs/format/CDataInterface.html) (FFI). +pub unsafe fn import_field_from_c(field: &ArrowSchema) -> Result { + to_field(field) +} + +/// Imports an [`Array`] from the C data interface. +/// # Safety +/// This function is intrinsically `unsafe` and relies on a [`ArrowArray`] +/// being valid according to the [C data interface](https://arrow.apache.org/docs/format/CDataInterface.html) (FFI). +pub unsafe fn import_array_from_c( + array: ArrowArray, + data_type: DataType, +) -> Result> { + try_from(InternalArrowArray::new(array, data_type)) +} diff --git a/crates/nano-arrow/src/ffi/schema.rs b/crates/nano-arrow/src/ffi/schema.rs new file mode 100644 index 000000000000..332410b0b6c5 --- /dev/null +++ b/crates/nano-arrow/src/ffi/schema.rs @@ -0,0 +1,633 @@ +use std::collections::BTreeMap; +use std::convert::TryInto; +use std::ffi::{CStr, CString}; +use std::ptr; + +use super::ArrowSchema; +use crate::datatypes::{ + DataType, Extension, Field, IntegerType, IntervalUnit, Metadata, TimeUnit, UnionMode, +}; +use crate::error::{Error, Result}; + +#[allow(dead_code)] +struct SchemaPrivateData { + name: CString, + format: CString, + metadata: Option>, + children_ptr: Box<[*mut ArrowSchema]>, + dictionary: Option<*mut ArrowSchema>, +} + +// callback used to drop [ArrowSchema] when it is exported. 
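The consumer side mirrors the exporters above: allocate empty structs, have the producer fill them, then import. A sketch in which the `fill` callback stands in for an external producer (error handling kept minimal):

```rust
// Consumer-side sketch of the C data interface, using the import functions above.
unsafe fn import_from_producer(
    fill: impl FnOnce(*mut crate::ffi::ArrowArray, *mut crate::ffi::ArrowSchema),
) -> crate::error::Result<Box<dyn crate::array::Array>> {
    use crate::ffi;

    let mut array = ffi::ArrowArray::empty();
    let mut schema = ffi::ArrowSchema::empty();

    // The producer writes into both structs through the raw pointers.
    fill(&mut array, &mut schema);

    // Recover the field first, then interpret the array with its data type.
    let field = ffi::import_field_from_c(&schema)?;
    ffi::import_array_from_c(array, field.data_type().clone())
}
```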
+unsafe extern "C" fn c_release_schema(schema: *mut ArrowSchema) { + if schema.is_null() { + return; + } + let schema = &mut *schema; + + let private = Box::from_raw(schema.private_data as *mut SchemaPrivateData); + for child in private.children_ptr.iter() { + let _ = Box::from_raw(*child); + } + + if let Some(ptr) = private.dictionary { + let _ = Box::from_raw(ptr); + } + + schema.release = None; +} + +/// allocate (and hold) the children +fn schema_children(data_type: &DataType, flags: &mut i64) -> Box<[*mut ArrowSchema]> { + match data_type { + DataType::List(field) | DataType::FixedSizeList(field, _) | DataType::LargeList(field) => { + Box::new([Box::into_raw(Box::new(ArrowSchema::new(field.as_ref())))]) + }, + DataType::Map(field, is_sorted) => { + *flags += (*is_sorted as i64) * 4; + Box::new([Box::into_raw(Box::new(ArrowSchema::new(field.as_ref())))]) + }, + DataType::Struct(fields) | DataType::Union(fields, _, _) => fields + .iter() + .map(|field| Box::into_raw(Box::new(ArrowSchema::new(field)))) + .collect::>(), + DataType::Extension(_, inner, _) => schema_children(inner, flags), + _ => Box::new([]), + } +} + +impl ArrowSchema { + /// creates a new [ArrowSchema] + pub(crate) fn new(field: &Field) -> Self { + let format = to_format(field.data_type()); + let name = field.name.clone(); + + let mut flags = field.is_nullable as i64 * 2; + + // note: this cannot be done along with the above because the above is fallible and this op leaks. + let children_ptr = schema_children(field.data_type(), &mut flags); + let n_children = children_ptr.len() as i64; + + let dictionary = if let DataType::Dictionary(_, values, is_ordered) = field.data_type() { + flags += *is_ordered as i64; + // we do not store field info in the dict values, so can't recover it all :( + let field = Field::new("", values.as_ref().clone(), true); + Some(Box::new(ArrowSchema::new(&field))) + } else { + None + }; + + let metadata = &field.metadata; + + let metadata = if let DataType::Extension(name, _, extension_metadata) = field.data_type() { + // append extension information. 
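For reference, the `flags` value assembled in `ArrowSchema::new` packs the three booleans defined by the C data interface: dictionary ordered (bit 0), nullable (bit 1), and map keys sorted (bit 2). A small decoding sketch (names are illustrative):

```rust
// Decode the ArrowSchema flag bits used above.
fn decode_schema_flags(flags: i64) -> (bool, bool, bool) {
    let dictionary_ordered = flags & 0b001 != 0;
    let nullable = flags & 0b010 != 0;
    let map_keys_sorted = flags & 0b100 != 0;
    (dictionary_ordered, nullable, map_keys_sorted)
}
```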
+ let mut metadata = metadata.clone(); + + // metadata + if let Some(extension_metadata) = extension_metadata { + metadata.insert( + "ARROW:extension:metadata".to_string(), + extension_metadata.clone(), + ); + } + + metadata.insert("ARROW:extension:name".to_string(), name.clone()); + + Some(metadata_to_bytes(&metadata)) + } else if !metadata.is_empty() { + Some(metadata_to_bytes(metadata)) + } else { + None + }; + + let name = CString::new(name).unwrap(); + let format = CString::new(format).unwrap(); + + let mut private = Box::new(SchemaPrivateData { + name, + format, + metadata, + children_ptr, + dictionary: dictionary.map(Box::into_raw), + }); + + // + Self { + format: private.format.as_ptr(), + name: private.name.as_ptr(), + metadata: private + .metadata + .as_ref() + .map(|x| x.as_ptr()) + .unwrap_or(std::ptr::null()) as *const ::std::os::raw::c_char, + flags, + n_children, + children: private.children_ptr.as_mut_ptr(), + dictionary: private.dictionary.unwrap_or(std::ptr::null_mut()), + release: Some(c_release_schema), + private_data: Box::into_raw(private) as *mut ::std::os::raw::c_void, + } + } + + /// create an empty [ArrowSchema] + pub fn empty() -> Self { + Self { + format: std::ptr::null_mut(), + name: std::ptr::null_mut(), + metadata: std::ptr::null_mut(), + flags: 0, + n_children: 0, + children: ptr::null_mut(), + dictionary: std::ptr::null_mut(), + release: None, + private_data: std::ptr::null_mut(), + } + } + + /// returns the format of this schema. + pub(crate) fn format(&self) -> &str { + assert!(!self.format.is_null()); + // safe because the lifetime of `self.format` equals `self` + unsafe { CStr::from_ptr(self.format) } + .to_str() + .expect("The external API has a non-utf8 as format") + } + + /// returns the name of this schema. + /// + /// Since this field is optional, `""` is returned if it is not set (as per the spec). + pub(crate) fn name(&self) -> &str { + if self.name.is_null() { + return ""; + } + // safe because the lifetime of `self.name` equals `self` + unsafe { CStr::from_ptr(self.name) }.to_str().unwrap() + } + + pub(crate) fn child(&self, index: usize) -> &'static Self { + assert!(index < self.n_children as usize); + unsafe { self.children.add(index).as_ref().unwrap().as_ref().unwrap() } + } + + pub(crate) fn dictionary(&self) -> Option<&'static Self> { + if self.dictionary.is_null() { + return None; + }; + Some(unsafe { self.dictionary.as_ref().unwrap() }) + } + + pub(crate) fn nullable(&self) -> bool { + (self.flags / 2) & 1 == 1 + } +} + +impl Drop for ArrowSchema { + fn drop(&mut self) { + match self.release { + None => (), + Some(release) => unsafe { release(self) }, + }; + } +} + +pub(crate) unsafe fn to_field(schema: &ArrowSchema) -> Result { + let dictionary = schema.dictionary(); + let data_type = if let Some(dictionary) = dictionary { + let indices = to_integer_type(schema.format())?; + let values = to_field(dictionary)?; + let is_ordered = schema.flags & 1 == 1; + DataType::Dictionary(indices, Box::new(values.data_type().clone()), is_ordered) + } else { + to_data_type(schema)? 
+ }; + let (metadata, extension) = unsafe { metadata_from_bytes(schema.metadata) }; + + let data_type = if let Some((name, extension_metadata)) = extension { + DataType::Extension(name, Box::new(data_type), extension_metadata) + } else { + data_type + }; + + Ok(Field::new(schema.name(), data_type, schema.nullable()).with_metadata(metadata)) +} + +fn to_integer_type(format: &str) -> Result { + use IntegerType::*; + Ok(match format { + "c" => Int8, + "C" => UInt8, + "s" => Int16, + "S" => UInt16, + "i" => Int32, + "I" => UInt32, + "l" => Int64, + "L" => UInt64, + _ => { + return Err(Error::OutOfSpec( + "Dictionary indices can only be integers".to_string(), + )) + }, + }) +} + +unsafe fn to_data_type(schema: &ArrowSchema) -> Result { + Ok(match schema.format() { + "n" => DataType::Null, + "b" => DataType::Boolean, + "c" => DataType::Int8, + "C" => DataType::UInt8, + "s" => DataType::Int16, + "S" => DataType::UInt16, + "i" => DataType::Int32, + "I" => DataType::UInt32, + "l" => DataType::Int64, + "L" => DataType::UInt64, + "e" => DataType::Float16, + "f" => DataType::Float32, + "g" => DataType::Float64, + "z" => DataType::Binary, + "Z" => DataType::LargeBinary, + "u" => DataType::Utf8, + "U" => DataType::LargeUtf8, + "tdD" => DataType::Date32, + "tdm" => DataType::Date64, + "tts" => DataType::Time32(TimeUnit::Second), + "ttm" => DataType::Time32(TimeUnit::Millisecond), + "ttu" => DataType::Time64(TimeUnit::Microsecond), + "ttn" => DataType::Time64(TimeUnit::Nanosecond), + "tDs" => DataType::Duration(TimeUnit::Second), + "tDm" => DataType::Duration(TimeUnit::Millisecond), + "tDu" => DataType::Duration(TimeUnit::Microsecond), + "tDn" => DataType::Duration(TimeUnit::Nanosecond), + "tiM" => DataType::Interval(IntervalUnit::YearMonth), + "tiD" => DataType::Interval(IntervalUnit::DayTime), + "+l" => { + let child = schema.child(0); + DataType::List(Box::new(to_field(child)?)) + }, + "+L" => { + let child = schema.child(0); + DataType::LargeList(Box::new(to_field(child)?)) + }, + "+m" => { + let child = schema.child(0); + + let is_sorted = (schema.flags & 4) != 0; + DataType::Map(Box::new(to_field(child)?), is_sorted) + }, + "+s" => { + let children = (0..schema.n_children as usize) + .map(|x| to_field(schema.child(x))) + .collect::>>()?; + DataType::Struct(children) + }, + other => { + match other.splitn(2, ':').collect::>()[..] 
{ + // Timestamps with no timezone + ["tss", ""] => DataType::Timestamp(TimeUnit::Second, None), + ["tsm", ""] => DataType::Timestamp(TimeUnit::Millisecond, None), + ["tsu", ""] => DataType::Timestamp(TimeUnit::Microsecond, None), + ["tsn", ""] => DataType::Timestamp(TimeUnit::Nanosecond, None), + + // Timestamps with timezone + ["tss", tz] => DataType::Timestamp(TimeUnit::Second, Some(tz.to_string())), + ["tsm", tz] => DataType::Timestamp(TimeUnit::Millisecond, Some(tz.to_string())), + ["tsu", tz] => DataType::Timestamp(TimeUnit::Microsecond, Some(tz.to_string())), + ["tsn", tz] => DataType::Timestamp(TimeUnit::Nanosecond, Some(tz.to_string())), + + ["w", size_raw] => { + // Example: "w:42" fixed-width binary [42 bytes] + let size = size_raw + .parse::() + .map_err(|_| Error::OutOfSpec("size is not a valid integer".to_string()))?; + DataType::FixedSizeBinary(size) + }, + ["+w", size_raw] => { + // Example: "+w:123" fixed-sized list [123 items] + let size = size_raw + .parse::() + .map_err(|_| Error::OutOfSpec("size is not a valid integer".to_string()))?; + let child = to_field(schema.child(0))?; + DataType::FixedSizeList(Box::new(child), size) + }, + ["d", raw] => { + // Decimal + let (precision, scale) = match raw.split(',').collect::>()[..] { + [precision_raw, scale_raw] => { + // Example: "d:19,10" decimal128 [precision 19, scale 10] + (precision_raw, scale_raw) + }, + [precision_raw, scale_raw, width_raw] => { + // Example: "d:19,10,NNN" decimal bitwidth = NNN [precision 19, scale 10] + // Only bitwdth of 128 currently supported + let bit_width = width_raw.parse::().map_err(|_| { + Error::OutOfSpec( + "Decimal bit width is not a valid integer".to_string(), + ) + })?; + if bit_width == 256 { + return Ok(DataType::Decimal256( + precision_raw.parse::().map_err(|_| { + Error::OutOfSpec( + "Decimal precision is not a valid integer".to_string(), + ) + })?, + scale_raw.parse::().map_err(|_| { + Error::OutOfSpec( + "Decimal scale is not a valid integer".to_string(), + ) + })?, + )); + } + (precision_raw, scale_raw) + }, + _ => { + return Err(Error::OutOfSpec( + "Decimal must contain 2 or 3 comma-separated values".to_string(), + )); + }, + }; + + DataType::Decimal( + precision.parse::().map_err(|_| { + Error::OutOfSpec("Decimal precision is not a valid integer".to_string()) + })?, + scale.parse::().map_err(|_| { + Error::OutOfSpec("Decimal scale is not a valid integer".to_string()) + })?, + ) + }, + [union_type @ "+us", union_parts] | [union_type @ "+ud", union_parts] => { + // union, sparse + // Example "+us:I,J,..." sparse union with type ids I,J... + // Example: "+ud:I,J,..." dense union with type ids I,J... 
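A few concrete format strings and the logical types they correspond to, mirroring the parsing above (a sketch; `to_format` is the inverse defined further down in this file):

```rust
// Example C-data-interface format strings and their DataType equivalents.
fn format_string_examples() {
    use crate::datatypes::{DataType, Field, TimeUnit};

    let examples = [
        ("l", DataType::Int64),
        (
            "tsu:UTC",
            DataType::Timestamp(TimeUnit::Microsecond, Some("UTC".to_string())),
        ),
        ("w:16", DataType::FixedSizeBinary(16)),
        ("d:19,10", DataType::Decimal(19, 10)),
        ("d:38,10,256", DataType::Decimal256(38, 10)),
        (
            "+l",
            DataType::List(Box::new(Field::new("item", DataType::Int32, true))),
        ),
    ];
    for (format, data_type) in examples {
        assert_eq!(to_format(&data_type), format);
    }
}
```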
+ let mode = UnionMode::sparse(union_type == "+us"); + let type_ids = union_parts + .split(',') + .map(|x| { + x.parse::().map_err(|_| { + Error::OutOfSpec("Union type id is not a valid integer".to_string()) + }) + }) + .collect::>>()?; + let fields = (0..schema.n_children as usize) + .map(|x| to_field(schema.child(x))) + .collect::>>()?; + DataType::Union(fields, Some(type_ids), mode) + }, + _ => { + return Err(Error::OutOfSpec(format!( + "The datatype \"{other}\" is still not supported in Rust implementation", + ))); + }, + } + }, + }) +} + +/// the inverse of [to_field] +fn to_format(data_type: &DataType) -> String { + match data_type { + DataType::Null => "n".to_string(), + DataType::Boolean => "b".to_string(), + DataType::Int8 => "c".to_string(), + DataType::UInt8 => "C".to_string(), + DataType::Int16 => "s".to_string(), + DataType::UInt16 => "S".to_string(), + DataType::Int32 => "i".to_string(), + DataType::UInt32 => "I".to_string(), + DataType::Int64 => "l".to_string(), + DataType::UInt64 => "L".to_string(), + DataType::Float16 => "e".to_string(), + DataType::Float32 => "f".to_string(), + DataType::Float64 => "g".to_string(), + DataType::Binary => "z".to_string(), + DataType::LargeBinary => "Z".to_string(), + DataType::Utf8 => "u".to_string(), + DataType::LargeUtf8 => "U".to_string(), + DataType::Date32 => "tdD".to_string(), + DataType::Date64 => "tdm".to_string(), + DataType::Time32(TimeUnit::Second) => "tts".to_string(), + DataType::Time32(TimeUnit::Millisecond) => "ttm".to_string(), + DataType::Time32(_) => { + unreachable!("Time32 is only supported for seconds and milliseconds") + }, + DataType::Time64(TimeUnit::Microsecond) => "ttu".to_string(), + DataType::Time64(TimeUnit::Nanosecond) => "ttn".to_string(), + DataType::Time64(_) => { + unreachable!("Time64 is only supported for micro and nanoseconds") + }, + DataType::Duration(TimeUnit::Second) => "tDs".to_string(), + DataType::Duration(TimeUnit::Millisecond) => "tDm".to_string(), + DataType::Duration(TimeUnit::Microsecond) => "tDu".to_string(), + DataType::Duration(TimeUnit::Nanosecond) => "tDn".to_string(), + DataType::Interval(IntervalUnit::YearMonth) => "tiM".to_string(), + DataType::Interval(IntervalUnit::DayTime) => "tiD".to_string(), + DataType::Interval(IntervalUnit::MonthDayNano) => { + todo!("Spec for FFI for MonthDayNano still not defined.") + }, + DataType::Timestamp(unit, tz) => { + let unit = match unit { + TimeUnit::Second => "s", + TimeUnit::Millisecond => "m", + TimeUnit::Microsecond => "u", + TimeUnit::Nanosecond => "n", + }; + format!( + "ts{}:{}", + unit, + tz.as_ref().map(|x| x.as_ref()).unwrap_or("") + ) + }, + DataType::Decimal(precision, scale) => format!("d:{precision},{scale}"), + DataType::Decimal256(precision, scale) => format!("d:{precision},{scale},256"), + DataType::List(_) => "+l".to_string(), + DataType::LargeList(_) => "+L".to_string(), + DataType::Struct(_) => "+s".to_string(), + DataType::FixedSizeBinary(size) => format!("w:{size}"), + DataType::FixedSizeList(_, size) => format!("+w:{size}"), + DataType::Union(f, ids, mode) => { + let sparsness = if mode.is_sparse() { 's' } else { 'd' }; + let mut r = format!("+u{sparsness}:"); + let ids = if let Some(ids) = ids { + ids.iter() + .fold(String::new(), |a, b| a + &b.to_string() + ",") + } else { + (0..f.len()).fold(String::new(), |a, b| a + &b.to_string() + ",") + }; + let ids = &ids[..ids.len() - 1]; // take away last "," + r.push_str(ids); + r + }, + DataType::Map(_, _) => "+m".to_string(), + DataType::Dictionary(index, _, _) => 
to_format(&(*index).into()), + DataType::Extension(_, inner, _) => to_format(inner.as_ref()), + } +} + +pub(super) fn get_child(data_type: &DataType, index: usize) -> Result { + match (index, data_type) { + (0, DataType::List(field)) => Ok(field.data_type().clone()), + (0, DataType::FixedSizeList(field, _)) => Ok(field.data_type().clone()), + (0, DataType::LargeList(field)) => Ok(field.data_type().clone()), + (0, DataType::Map(field, _)) => Ok(field.data_type().clone()), + (index, DataType::Struct(fields)) => Ok(fields[index].data_type().clone()), + (index, DataType::Union(fields, _, _)) => Ok(fields[index].data_type().clone()), + (index, DataType::Extension(_, subtype, _)) => get_child(subtype, index), + (child, data_type) => Err(Error::OutOfSpec(format!( + "Requested child {child} to type {data_type:?} that has no such child", + ))), + } +} + +fn metadata_to_bytes(metadata: &BTreeMap) -> Vec { + let a = (metadata.len() as i32).to_ne_bytes().to_vec(); + metadata.iter().fold(a, |mut acc, (key, value)| { + acc.extend((key.len() as i32).to_ne_bytes()); + acc.extend(key.as_bytes()); + acc.extend((value.len() as i32).to_ne_bytes()); + acc.extend(value.as_bytes()); + acc + }) +} + +unsafe fn read_ne_i32(ptr: *const u8) -> i32 { + let slice = std::slice::from_raw_parts(ptr, 4); + i32::from_ne_bytes(slice.try_into().unwrap()) +} + +unsafe fn read_bytes(ptr: *const u8, len: usize) -> &'static str { + let slice = std::slice::from_raw_parts(ptr, len); + simdutf8::basic::from_utf8(slice).unwrap() +} + +unsafe fn metadata_from_bytes(data: *const ::std::os::raw::c_char) -> (Metadata, Extension) { + let mut data = data as *const u8; // u8 = i8 + if data.is_null() { + return (Metadata::default(), None); + }; + let len = read_ne_i32(data); + data = data.add(4); + + let mut result = BTreeMap::new(); + let mut extension_name = None; + let mut extension_metadata = None; + for _ in 0..len { + let key_len = read_ne_i32(data) as usize; + data = data.add(4); + let key = read_bytes(data, key_len); + data = data.add(key_len); + let value_len = read_ne_i32(data) as usize; + data = data.add(4); + let value = read_bytes(data, value_len); + data = data.add(value_len); + match key { + "ARROW:extension:name" => { + extension_name = Some(value.to_string()); + }, + "ARROW:extension:metadata" => { + extension_metadata = Some(value.to_string()); + }, + _ => { + result.insert(key.to_string(), value.to_string()); + }, + }; + } + let extension = extension_name.map(|name| (name, extension_metadata)); + (result, extension) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_all() { + let mut dts = vec![ + DataType::Null, + DataType::Boolean, + DataType::UInt8, + DataType::UInt16, + DataType::UInt32, + DataType::UInt64, + DataType::Int8, + DataType::Int16, + DataType::Int32, + DataType::Int64, + DataType::Float32, + DataType::Float64, + DataType::Date32, + DataType::Date64, + DataType::Time32(TimeUnit::Second), + DataType::Time32(TimeUnit::Millisecond), + DataType::Time64(TimeUnit::Microsecond), + DataType::Time64(TimeUnit::Nanosecond), + DataType::Decimal(5, 5), + DataType::Utf8, + DataType::LargeUtf8, + DataType::Binary, + DataType::LargeBinary, + DataType::FixedSizeBinary(2), + DataType::List(Box::new(Field::new("example", DataType::Boolean, false))), + DataType::FixedSizeList(Box::new(Field::new("example", DataType::Boolean, false)), 2), + DataType::LargeList(Box::new(Field::new("example", DataType::Boolean, false))), + DataType::Struct(vec![ + Field::new("a", DataType::Int64, true), + Field::new( + "b", + 
DataType::List(Box::new(Field::new("item", DataType::Int32, true))), + true, + ), + ]), + DataType::Map(Box::new(Field::new("a", DataType::Int64, true)), true), + DataType::Union( + vec![ + Field::new("a", DataType::Int64, true), + Field::new( + "b", + DataType::List(Box::new(Field::new("item", DataType::Int32, true))), + true, + ), + ], + Some(vec![1, 2]), + UnionMode::Dense, + ), + DataType::Union( + vec![ + Field::new("a", DataType::Int64, true), + Field::new( + "b", + DataType::List(Box::new(Field::new("item", DataType::Int32, true))), + true, + ), + ], + Some(vec![0, 1]), + UnionMode::Sparse, + ), + ]; + for time_unit in [ + TimeUnit::Second, + TimeUnit::Millisecond, + TimeUnit::Microsecond, + TimeUnit::Nanosecond, + ] { + dts.push(DataType::Timestamp(time_unit, None)); + dts.push(DataType::Timestamp(time_unit, Some("00:00".to_string()))); + dts.push(DataType::Duration(time_unit)); + } + for interval_type in [ + IntervalUnit::DayTime, + IntervalUnit::YearMonth, + //IntervalUnit::MonthDayNano, // not yet defined on the C data interface + ] { + dts.push(DataType::Interval(interval_type)); + } + + for expected in dts { + let field = Field::new("a", expected.clone(), true); + let schema = ArrowSchema::new(&field); + let result = unsafe { super::to_data_type(&schema).unwrap() }; + assert_eq!(result, expected); + } + } +} diff --git a/crates/nano-arrow/src/ffi/stream.rs b/crates/nano-arrow/src/ffi/stream.rs new file mode 100644 index 000000000000..4776014bca54 --- /dev/null +++ b/crates/nano-arrow/src/ffi/stream.rs @@ -0,0 +1,226 @@ +use std::ffi::{CStr, CString}; +use std::ops::DerefMut; + +use super::{ + export_array_to_c, export_field_to_c, import_array_from_c, import_field_from_c, ArrowArray, + ArrowArrayStream, ArrowSchema, +}; +use crate::array::Array; +use crate::datatypes::Field; +use crate::error::Error; + +impl Drop for ArrowArrayStream { + fn drop(&mut self) { + match self.release { + None => (), + Some(release) => unsafe { release(self) }, + }; + } +} + +impl ArrowArrayStream { + /// Creates an empty [`ArrowArrayStream`] used to import from a producer. + pub fn empty() -> Self { + Self { + get_schema: None, + get_next: None, + get_last_error: None, + release: None, + private_data: std::ptr::null_mut(), + } + } +} + +unsafe fn handle_error(iter: &mut ArrowArrayStream) -> Error { + let error = unsafe { (iter.get_last_error.unwrap())(&mut *iter) }; + + if error.is_null() { + return Error::External( + "C stream".to_string(), + Box::new(Error::ExternalFormat("an unspecified error".to_string())), + ); + } + + let error = unsafe { CStr::from_ptr(error) }; + Error::External( + "C stream".to_string(), + Box::new(Error::ExternalFormat(error.to_str().unwrap().to_string())), + ) +} + +/// Implements an iterator of [`Array`] consumed from the [C stream interface](https://arrow.apache.org/docs/format/CStreamInterface.html). +pub struct ArrowArrayStreamReader> { + iter: Iter, + field: Field, +} + +impl> ArrowArrayStreamReader { + /// Returns a new [`ArrowArrayStreamReader`] + /// # Error + /// Errors iff the [`ArrowArrayStream`] is out of specification, + /// or was already released prior to calling this function. + /// # Safety + /// This method is intrinsically `unsafe` since it assumes that the `ArrowArrayStream` + /// contains a valid Arrow C stream interface. 
+ /// In particular: + /// * The `ArrowArrayStream` fulfills the invariants of the C stream interface + /// * The schema `get_schema` produces fulfills the C data interface + pub unsafe fn try_new(mut iter: Iter) -> Result { + if iter.release.is_none() { + return Err(Error::InvalidArgumentError( + "The C stream was already released".to_string(), + )); + }; + + if iter.get_next.is_none() { + return Err(Error::OutOfSpec( + "The C stream MUST contain a non-null get_next".to_string(), + )); + }; + + if iter.get_last_error.is_none() { + return Err(Error::OutOfSpec( + "The C stream MUST contain a non-null get_last_error".to_string(), + )); + }; + + let mut field = ArrowSchema::empty(); + let status = if let Some(f) = iter.get_schema { + unsafe { (f)(&mut *iter, &mut field) } + } else { + return Err(Error::OutOfSpec( + "The C stream MUST contain a non-null get_schema".to_string(), + )); + }; + + if status != 0 { + return Err(unsafe { handle_error(&mut iter) }); + } + + let field = unsafe { import_field_from_c(&field)? }; + + Ok(Self { iter, field }) + } + + /// Returns the field provided by the stream + pub fn field(&self) -> &Field { + &self.field + } + + /// Advances this iterator by one array + /// # Error + /// Errors iff: + /// * The C stream interface returns an error + /// * The C stream interface returns an invalid array (that we can identify, see Safety below) + /// # Safety + /// Calling this iterator's `next` assumes that the [`ArrowArrayStream`] produces arrow arrays + /// that fulfill the C data interface + pub unsafe fn next(&mut self) -> Option, Error>> { + let mut array = ArrowArray::empty(); + let status = unsafe { (self.iter.get_next.unwrap())(&mut *self.iter, &mut array) }; + + if status != 0 { + return Some(Err(unsafe { handle_error(&mut self.iter) })); + } + + // last paragraph of https://arrow.apache.org/docs/format/CStreamInterface.html#c.ArrowArrayStream.get_next + array.release?; + + // Safety: assumed from the C stream interface + unsafe { import_array_from_c(array, self.field.data_type.clone()) } + .map(Some) + .transpose() + } +} + +struct PrivateData { + iter: Box, Error>>>, + field: Field, + error: Option, +} + +unsafe extern "C" fn get_next(iter: *mut ArrowArrayStream, array: *mut ArrowArray) -> i32 { + if iter.is_null() { + return 2001; + } + let private = &mut *((*iter).private_data as *mut PrivateData); + + match private.iter.next() { + Some(Ok(item)) => { + // check that the array has the same data_type as field + let item_dt = item.data_type(); + let expected_dt = private.field.data_type(); + if item_dt != expected_dt { + private.error = Some(CString::new(format!("The iterator produced an item of data type {item_dt:?} but the producer expects data type {expected_dt:?}").as_bytes().to_vec()).unwrap()); + return 2001; // custom application specific error (since this is never a result of this interface) + } + + std::ptr::write(array, export_array_to_c(item)); + + private.error = None; + 0 + }, + Some(Err(err)) => { + private.error = Some(CString::new(err.to_string().as_bytes().to_vec()).unwrap()); + 2001 // custom application specific error (since this is never a result of this interface) + }, + None => { + let a = ArrowArray::empty(); + std::ptr::write_unaligned(array, a); + private.error = None; + 0 + }, + } +} + +unsafe extern "C" fn get_schema(iter: *mut ArrowArrayStream, schema: *mut ArrowSchema) -> i32 { + if iter.is_null() { + return 2001; + } + let private = &mut *((*iter).private_data as *mut PrivateData); + + std::ptr::write(schema, 
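+    // write an exported copy of the producer's field into the caller-provided schema slot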
export_field_to_c(&private.field));
+    0
+}
+
+unsafe extern "C" fn get_last_error(iter: *mut ArrowArrayStream) -> *const ::std::os::raw::c_char {
+    if iter.is_null() {
+        return std::ptr::null();
+    }
+    let private = &mut *((*iter).private_data as *mut PrivateData);
+
+    private
+        .error
+        .as_ref()
+        .map(|x| x.as_ptr())
+        .unwrap_or(std::ptr::null())
+}
+
+unsafe extern "C" fn release(iter: *mut ArrowArrayStream) {
+    if iter.is_null() {
+        return;
+    }
+    let _ = Box::from_raw((*iter).private_data as *mut PrivateData);
+    (*iter).release = None;
+    // private drops automatically
+}
+
+/// Exports an iterator to the [C stream interface](https://arrow.apache.org/docs/format/CStreamInterface.html)
+pub fn export_iterator(
+    iter: Box<dyn Iterator<Item = Result<Box<dyn Array>, Error>>>,
+    field: Field,
+) -> ArrowArrayStream {
+    let private_data = Box::new(PrivateData {
+        iter,
+        field,
+        error: None,
+    });
+
+    ArrowArrayStream {
+        get_schema: Some(get_schema),
+        get_next: Some(get_next),
+        get_last_error: Some(get_last_error),
+        release: Some(release),
+        private_data: Box::into_raw(private_data) as *mut ::std::os::raw::c_void,
+    }
+}
diff --git a/crates/nano-arrow/src/io/README.md b/crates/nano-arrow/src/io/README.md
new file mode 100644
index 000000000000..a3c7599b8bdf
--- /dev/null
+++ b/crates/nano-arrow/src/io/README.md
@@ -0,0 +1,24 @@
+# IO module
+
+This document describes the overall design of this module.
+
+## Rules
+
+- Each directory in this module corresponds to a specific format such as `csv` and `json`.
+- Directories that depend on external dependencies MUST be feature gated, with a feature named with the prefix `io_`.
+- Modules MUST re-export any API of external dependencies they require as part of their public API.
+  E.g.
+  - if a module has an API `write(writer: &mut csv::Writer, ...)`, it MUST contain `pub use csv::Writer;`.
+
+  The rationale is that adding this crate to `Cargo.toml` must be sufficient to use it.
+- Each directory SHOULD contain two directories, `read` and `write`, corresponding
+  to functionality about reading from the format and writing to the format respectively.
+- The base module SHOULD contain `pub use read;` and `pub use write;`.
+- Implementations SHOULD separate reading of "data" from reading of "metadata". Examples:
+  - schema read or inference SHOULD be a separate function
+  - functions that read "data" SHOULD consume a schema typically pre-read.
+- Implementations SHOULD separate IO-bounded operations from CPU-bounded operations.
+  I.e. implementations SHOULD:
+  - contain functions that consume a `Read` implementor and output a "raw" struct, i.e. a struct that is e.g. compressed and serialized
+  - contain functions that consume a "raw" struct and convert it into Arrow.
+  - offer each of these functions as independent public APIs, so that consumers can decide how to balance CPU-bounds and IO-bounds.
diff --git a/crates/nano-arrow/src/io/avro/mod.rs b/crates/nano-arrow/src/io/avro/mod.rs
new file mode 100644
index 000000000000..bf7bda85f197
--- /dev/null
+++ b/crates/nano-arrow/src/io/avro/mod.rs
@@ -0,0 +1,42 @@
+//! Read from and write to Apache Avro
+
+pub use avro_schema;
+
+impl From<avro_schema::error::Error> for crate::error::Error {
+    fn from(error: avro_schema::error::Error) -> Self {
+        Self::ExternalFormat(error.to_string())
+    }
+}
+
+pub mod read;
+pub mod write;
+
+// macro that can operate in both sync and async code.
+macro_rules!
avro_decode { + ($reader:ident $($_await:tt)*) => { + { + let mut i = 0u64; + let mut buf = [0u8; 1]; + let mut j = 0; + loop { + if j > 9 { + // if j * 7 > 64 + return Err(Error::ExternalFormat( + "zigzag decoding failed - corrupt avro file".to_string(), + )); + } + $reader.read_exact(&mut buf[..])$($_await)*?; + i |= (u64::from(buf[0] & 0x7F)) << (j * 7); + if (buf[0] >> 7) == 0 { + break; + } else { + j += 1; + } + } + + Ok(i) + } + } +} + +pub(crate) use avro_decode; diff --git a/crates/nano-arrow/src/io/avro/read/deserialize.rs b/crates/nano-arrow/src/io/avro/read/deserialize.rs new file mode 100644 index 000000000000..6cafd9d8c4c1 --- /dev/null +++ b/crates/nano-arrow/src/io/avro/read/deserialize.rs @@ -0,0 +1,526 @@ +use std::convert::TryInto; + +use avro_schema::file::Block; +use avro_schema::schema::{Enum, Field as AvroField, Record, Schema as AvroSchema}; + +use super::nested::*; +use super::util; +use crate::array::*; +use crate::chunk::Chunk; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::types::months_days_ns; + +fn make_mutable( + data_type: &DataType, + avro_field: Option<&AvroSchema>, + capacity: usize, +) -> Result> { + Ok(match data_type.to_physical_type() { + PhysicalType::Boolean => { + Box::new(MutableBooleanArray::with_capacity(capacity)) as Box + }, + PhysicalType::Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(MutablePrimitiveArray::<$T>::with_capacity(capacity).to(data_type.clone())) + as Box + }), + PhysicalType::Binary => { + Box::new(MutableBinaryArray::::with_capacity(capacity)) as Box + }, + PhysicalType::Utf8 => { + Box::new(MutableUtf8Array::::with_capacity(capacity)) as Box + }, + PhysicalType::Dictionary(_) => { + if let Some(AvroSchema::Enum(Enum { symbols, .. 
})) = avro_field { + let values = Utf8Array::::from_slice(symbols); + Box::new(FixedItemsUtf8Dictionary::with_capacity(values, capacity)) + as Box + } else { + unreachable!() + } + }, + _ => match data_type { + DataType::List(inner) => { + let values = make_mutable(inner.data_type(), None, 0)?; + Box::new(DynMutableListArray::::new_from( + values, + data_type.clone(), + capacity, + )) as Box + }, + DataType::FixedSizeBinary(size) => { + Box::new(MutableFixedSizeBinaryArray::with_capacity(*size, capacity)) + as Box + }, + DataType::Struct(fields) => { + let values = fields + .iter() + .map(|field| make_mutable(field.data_type(), None, capacity)) + .collect::>>()?; + Box::new(DynMutableStructArray::new(values, data_type.clone())) + as Box + }, + other => { + return Err(Error::NotYetImplemented(format!( + "Deserializing type {other:#?} is still not implemented" + ))) + }, + }, + }) +} + +fn is_union_null_first(avro_field: &AvroSchema) -> bool { + if let AvroSchema::Union(schemas) = avro_field { + schemas[0] == AvroSchema::Null + } else { + unreachable!() + } +} + +fn deserialize_item<'a>( + array: &mut dyn MutableArray, + is_nullable: bool, + avro_field: &AvroSchema, + mut block: &'a [u8], +) -> Result<&'a [u8]> { + if is_nullable { + let variant = util::zigzag_i64(&mut block)?; + let is_null_first = is_union_null_first(avro_field); + if is_null_first && variant == 0 || !is_null_first && variant != 0 { + array.push_null(); + return Ok(block); + } + } + deserialize_value(array, avro_field, block) +} + +fn deserialize_value<'a>( + array: &mut dyn MutableArray, + avro_field: &AvroSchema, + mut block: &'a [u8], +) -> Result<&'a [u8]> { + let data_type = array.data_type(); + match data_type { + DataType::List(inner) => { + let is_nullable = inner.is_nullable; + let avro_inner = match avro_field { + AvroSchema::Array(inner) => inner.as_ref(), + AvroSchema::Union(u) => match &u.as_slice() { + &[AvroSchema::Array(inner), _] | &[_, AvroSchema::Array(inner)] => { + inner.as_ref() + }, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + // Arrays are encoded as a series of blocks. + loop { + // Each block consists of a long count value, followed by that many array items. + let len = util::zigzag_i64(&mut block)?; + let len = if len < 0 { + // Avro spec: If a block's count is negative, its absolute value is used, + // and the count is followed immediately by a long block size indicating the number of bytes in the block. This block size permits fast skipping through data, e.g., when projecting a record to a subset of its fields. + let _ = util::zigzag_i64(&mut block)?; + + -len + } else { + len + }; + + // A block with count zero indicates the end of the array. + if len == 0 { + break; + } + + // Each item is encoded per the array’s item schema. + let values = array.mut_values(); + for _ in 0..len { + block = deserialize_item(values, is_nullable, avro_inner, block)?; + } + } + array.try_push_valid()?; + }, + DataType::Struct(inner_fields) => { + let fields = match avro_field { + AvroSchema::Record(Record { fields, .. }) => fields, + AvroSchema::Union(u) => match &u.as_slice() { + &[AvroSchema::Record(Record { fields, .. }), _] + | &[_, AvroSchema::Record(Record { fields, .. 
})] => fields, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + + let is_nullable = inner_fields + .iter() + .map(|x| x.is_nullable) + .collect::>(); + let array = array + .as_mut_any() + .downcast_mut::() + .unwrap(); + + for (index, (field, is_nullable)) in fields.iter().zip(is_nullable.iter()).enumerate() { + let values = array.mut_values(index); + block = deserialize_item(values, *is_nullable, &field.schema, block)?; + } + array.try_push_valid()?; + }, + _ => match data_type.to_physical_type() { + PhysicalType::Boolean => { + let is_valid = block[0] == 1; + block = &block[1..]; + let array = array + .as_mut_any() + .downcast_mut::() + .unwrap(); + array.push(Some(is_valid)) + }, + PhysicalType::Primitive(primitive) => match primitive { + PrimitiveType::Int32 => { + let value = util::zigzag_i64(&mut block)? as i32; + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(value)) + }, + PrimitiveType::Int64 => { + let value = util::zigzag_i64(&mut block)?; + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(value)) + }, + PrimitiveType::Float32 => { + let value = + f32::from_le_bytes(block[..std::mem::size_of::()].try_into().unwrap()); + block = &block[std::mem::size_of::()..]; + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(value)) + }, + PrimitiveType::Float64 => { + let value = + f64::from_le_bytes(block[..std::mem::size_of::()].try_into().unwrap()); + block = &block[std::mem::size_of::()..]; + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(value)) + }, + PrimitiveType::MonthDayNano => { + // https://avro.apache.org/docs/current/spec.html#Duration + // 12 bytes, months, days, millis in LE + let data = &block[..12]; + block = &block[12..]; + + let value = months_days_ns::new( + i32::from_le_bytes([data[0], data[1], data[2], data[3]]), + i32::from_le_bytes([data[4], data[5], data[6], data[7]]), + i32::from_le_bytes([data[8], data[9], data[10], data[11]]) as i64 + * 1_000_000, + ); + + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(value)) + }, + PrimitiveType::Int128 => { + let avro_inner = match avro_field { + AvroSchema::Bytes(_) | AvroSchema::Fixed(_) => avro_field, + AvroSchema::Union(u) => match &u.as_slice() { + &[e, AvroSchema::Null] | &[AvroSchema::Null, e] => e, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + let len = match avro_inner { + AvroSchema::Bytes(_) => { + util::zigzag_i64(&mut block)?.try_into().map_err(|_| { + Error::ExternalFormat( + "Avro format contains a non-usize number of bytes".to_string(), + ) + })? 
+ }, + AvroSchema::Fixed(b) => b.size, + _ => unreachable!(), + }; + if len > 16 { + return Err(Error::ExternalFormat( + "Avro decimal bytes return more than 16 bytes".to_string(), + )); + } + let mut bytes = [0u8; 16]; + bytes[..len].copy_from_slice(&block[..len]); + block = &block[len..]; + let data = i128::from_be_bytes(bytes) >> (8 * (16 - len)); + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(data)) + }, + _ => unreachable!(), + }, + PhysicalType::Utf8 => { + let len: usize = util::zigzag_i64(&mut block)?.try_into().map_err(|_| { + Error::ExternalFormat( + "Avro format contains a non-usize number of bytes".to_string(), + ) + })?; + let data = simdutf8::basic::from_utf8(&block[..len])?; + block = &block[len..]; + + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(data)) + }, + PhysicalType::Binary => { + let len: usize = util::zigzag_i64(&mut block)?.try_into().map_err(|_| { + Error::ExternalFormat( + "Avro format contains a non-usize number of bytes".to_string(), + ) + })?; + let data = &block[..len]; + block = &block[len..]; + + let array = array + .as_mut_any() + .downcast_mut::>() + .unwrap(); + array.push(Some(data)); + }, + PhysicalType::FixedSizeBinary => { + let array = array + .as_mut_any() + .downcast_mut::() + .unwrap(); + let len = array.size(); + let data = &block[..len]; + block = &block[len..]; + array.push(Some(data)); + }, + PhysicalType::Dictionary(_) => { + let index = util::zigzag_i64(&mut block)? as i32; + let array = array + .as_mut_any() + .downcast_mut::() + .unwrap(); + array.push_valid(index); + }, + _ => todo!(), + }, + }; + Ok(block) +} + +fn skip_item<'a>(field: &Field, avro_field: &AvroSchema, mut block: &'a [u8]) -> Result<&'a [u8]> { + if field.is_nullable { + let variant = util::zigzag_i64(&mut block)?; + let is_null_first = is_union_null_first(avro_field); + if is_null_first && variant == 0 || !is_null_first && variant != 0 { + return Ok(block); + } + } + match &field.data_type { + DataType::List(inner) => { + let avro_inner = match avro_field { + AvroSchema::Array(inner) => inner.as_ref(), + AvroSchema::Union(u) => match &u.as_slice() { + &[AvroSchema::Array(inner), _] | &[_, AvroSchema::Array(inner)] => { + inner.as_ref() + }, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + + loop { + let len = util::zigzag_i64(&mut block)?; + let (len, bytes) = if len < 0 { + // Avro spec: If a block's count is negative, its absolute value is used, + // and the count is followed immediately by a long block size indicating the number of bytes in the block. This block size permits fast skipping through data, e.g., when projecting a record to a subset of its fields. + let bytes = util::zigzag_i64(&mut block)?; + + (-len, Some(bytes)) + } else { + (len, None) + }; + + let bytes: Option = bytes + .map(|bytes| { + bytes + .try_into() + .map_err(|_| Error::oos("Avro block size negative or too large")) + }) + .transpose()?; + + if len == 0 { + break; + } + + if let Some(bytes) = bytes { + block = &block[bytes..]; + } else { + for _ in 0..len { + block = skip_item(inner, avro_inner, block)?; + } + } + } + }, + DataType::Struct(inner_fields) => { + let fields = match avro_field { + AvroSchema::Record(Record { fields, .. }) => fields, + AvroSchema::Union(u) => match &u.as_slice() { + &[AvroSchema::Record(Record { fields, .. }), _] + | &[_, AvroSchema::Record(Record { fields, .. 
})] => fields, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + + for (field, avro_field) in inner_fields.iter().zip(fields.iter()) { + block = skip_item(field, &avro_field.schema, block)?; + } + }, + _ => match field.data_type.to_physical_type() { + PhysicalType::Boolean => { + let _ = block[0] == 1; + block = &block[1..]; + }, + PhysicalType::Primitive(primitive) => match primitive { + PrimitiveType::Int32 => { + let _ = util::zigzag_i64(&mut block)?; + }, + PrimitiveType::Int64 => { + let _ = util::zigzag_i64(&mut block)?; + }, + PrimitiveType::Float32 => { + block = &block[std::mem::size_of::()..]; + }, + PrimitiveType::Float64 => { + block = &block[std::mem::size_of::()..]; + }, + PrimitiveType::MonthDayNano => { + block = &block[12..]; + }, + PrimitiveType::Int128 => { + let avro_inner = match avro_field { + AvroSchema::Bytes(_) | AvroSchema::Fixed(_) => avro_field, + AvroSchema::Union(u) => match &u.as_slice() { + &[e, AvroSchema::Null] | &[AvroSchema::Null, e] => e, + _ => unreachable!(), + }, + _ => unreachable!(), + }; + let len = match avro_inner { + AvroSchema::Bytes(_) => { + util::zigzag_i64(&mut block)?.try_into().map_err(|_| { + Error::ExternalFormat( + "Avro format contains a non-usize number of bytes".to_string(), + ) + })? + }, + AvroSchema::Fixed(b) => b.size, + _ => unreachable!(), + }; + block = &block[len..]; + }, + _ => unreachable!(), + }, + PhysicalType::Utf8 | PhysicalType::Binary => { + let len: usize = util::zigzag_i64(&mut block)?.try_into().map_err(|_| { + Error::ExternalFormat( + "Avro format contains a non-usize number of bytes".to_string(), + ) + })?; + block = &block[len..]; + }, + PhysicalType::FixedSizeBinary => { + let len = if let DataType::FixedSizeBinary(len) = &field.data_type { + *len + } else { + unreachable!() + }; + + block = &block[len..]; + }, + PhysicalType::Dictionary(_) => { + let _ = util::zigzag_i64(&mut block)? as i32; + }, + _ => todo!(), + }, + } + Ok(block) +} + +/// Deserializes a [`Block`] assumed to be encoded according to [`AvroField`] into [`Chunk`], +/// using `projection` to ignore `avro_fields`. +/// # Panics +/// `fields`, `avro_fields` and `projection` must have the same length. +pub fn deserialize( + block: &Block, + fields: &[Field], + avro_fields: &[AvroField], + projection: &[bool], +) -> Result>> { + assert_eq!(fields.len(), avro_fields.len()); + assert_eq!(fields.len(), projection.len()); + + let rows = block.number_of_rows; + let mut block = block.data.as_ref(); + + // create mutables, one per field + let mut arrays: Vec> = fields + .iter() + .zip(avro_fields.iter()) + .zip(projection.iter()) + .map(|((field, avro_field), projection)| { + if *projection { + make_mutable(&field.data_type, Some(&avro_field.schema), rows) + } else { + // just something; we are not going to use it + make_mutable(&DataType::Int32, None, 0) + } + }) + .collect::>()?; + + // this is _the_ expensive transpose (rows -> columns) + for _ in 0..rows { + let iter = arrays + .iter_mut() + .zip(fields.iter()) + .zip(avro_fields.iter()) + .zip(projection.iter()); + + for (((array, field), avro_field), projection) in iter { + block = if *projection { + deserialize_item(array.as_mut(), field.is_nullable, &avro_field.schema, block) + } else { + skip_item(field, &avro_field.schema, block) + }? 
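+            // in both branches `block` was advanced past this field's bytes, so the cursor
+            // stays aligned for the next column of the same row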
+ } + } + Chunk::try_new( + arrays + .iter_mut() + .zip(projection.iter()) + .filter_map(|x| x.1.then(|| x.0)) + .map(|array| array.as_box()) + .collect(), + ) +} diff --git a/crates/nano-arrow/src/io/avro/read/mod.rs b/crates/nano-arrow/src/io/avro/read/mod.rs new file mode 100644 index 000000000000..5014499c12a6 --- /dev/null +++ b/crates/nano-arrow/src/io/avro/read/mod.rs @@ -0,0 +1,67 @@ +//! APIs to read from Avro format to arrow. +use std::io::Read; + +use avro_schema::file::FileMetadata; +use avro_schema::read::fallible_streaming_iterator::FallibleStreamingIterator; +use avro_schema::read::{block_iterator, BlockStreamingIterator}; +use avro_schema::schema::Field as AvroField; + +mod deserialize; +pub use deserialize::deserialize; +mod nested; +mod schema; +mod util; + +pub use schema::infer_schema; + +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Field; +use crate::error::Result; + +/// Single threaded, blocking reader of Avro; [`Iterator`] of [`Chunk`]. +pub struct Reader { + iter: BlockStreamingIterator, + avro_fields: Vec, + fields: Vec, + projection: Vec, +} + +impl Reader { + /// Creates a new [`Reader`]. + pub fn new( + reader: R, + metadata: FileMetadata, + fields: Vec, + projection: Option>, + ) -> Self { + let projection = projection.unwrap_or_else(|| fields.iter().map(|_| true).collect()); + + Self { + iter: block_iterator(reader, metadata.compression, metadata.marker), + avro_fields: metadata.record.fields, + fields, + projection, + } + } + + /// Deconstructs itself into its internal reader + pub fn into_inner(self) -> R { + self.iter.into_inner() + } +} + +impl Iterator for Reader { + type Item = Result>>; + + fn next(&mut self) -> Option { + let fields = &self.fields[..]; + let avro_fields = &self.avro_fields; + let projection = &self.projection; + + self.iter + .next() + .transpose() + .map(|maybe_block| deserialize(maybe_block?, fields, avro_fields, projection)) + } +} diff --git a/crates/nano-arrow/src/io/avro/read/nested.rs b/crates/nano-arrow/src/io/avro/read/nested.rs new file mode 100644 index 000000000000..056d9a8f836e --- /dev/null +++ b/crates/nano-arrow/src/io/avro/read/nested.rs @@ -0,0 +1,309 @@ +use crate::array::*; +use crate::bitmap::*; +use crate::datatypes::*; +use crate::error::*; +use crate::offset::{Offset, Offsets}; + +/// Auxiliary struct +#[derive(Debug)] +pub struct DynMutableListArray { + data_type: DataType, + offsets: Offsets, + values: Box, + validity: Option, +} + +impl DynMutableListArray { + pub fn new_from(values: Box, data_type: DataType, capacity: usize) -> Self { + assert_eq!(values.len(), 0); + ListArray::::get_child_field(&data_type); + Self { + data_type, + offsets: Offsets::::with_capacity(capacity), + values, + validity: None, + } + } + + /// The values + pub fn mut_values(&mut self) -> &mut dyn MutableArray { + self.values.as_mut() + } + + #[inline] + pub fn try_push_valid(&mut self) -> Result<()> { + let total_length = self.values.len(); + let offset = self.offsets.last().to_usize(); + let length = total_length.checked_sub(offset).ok_or(Error::Overflow)?; + + self.offsets.try_push_usize(length)?; + if let Some(validity) = &mut self.validity { + validity.push(true) + } + Ok(()) + } + + #[inline] + fn push_null(&mut self) { + self.offsets.extend_constant(1); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + } + + fn init_validity(&mut self) { + let len = self.offsets.len_proxy(); + + let mut validity = MutableBitmap::new(); + 
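+        // all entries pushed before this first null were valid; backfill them with `true`
+        // and flip the entry just pushed (the last one) to null below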
validity.extend_constant(len, true); + validity.set(len - 1, false); + self.validity = Some(validity) + } +} + +impl MutableArray for DynMutableListArray { + fn len(&self) -> usize { + self.offsets.len_proxy() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + ListArray::new( + self.data_type.clone(), + std::mem::take(&mut self.offsets).into(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .boxed() + } + + fn as_arc(&mut self) -> std::sync::Arc { + ListArray::new( + self.data_type.clone(), + std::mem::take(&mut self.offsets).into(), + self.values.as_box(), + std::mem::take(&mut self.validity).map(|x| x.into()), + ) + .arced() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push_null() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!(); + } +} + +#[derive(Debug)] +pub struct FixedItemsUtf8Dictionary { + data_type: DataType, + keys: MutablePrimitiveArray, + values: Utf8Array, +} + +impl FixedItemsUtf8Dictionary { + pub fn with_capacity(values: Utf8Array, capacity: usize) -> Self { + Self { + data_type: DataType::Dictionary( + IntegerType::Int32, + Box::new(values.data_type().clone()), + false, + ), + keys: MutablePrimitiveArray::::with_capacity(capacity), + values, + } + } + + pub fn push_valid(&mut self, key: i32) { + self.keys.push(Some(key)) + } + + /// pushes a null value + pub fn push_null(&mut self) { + self.keys.push(None) + } +} + +impl MutableArray for FixedItemsUtf8Dictionary { + fn len(&self) -> usize { + self.keys.len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.keys.validity() + } + + fn as_box(&mut self) -> Box { + Box::new( + DictionaryArray::try_new( + self.data_type.clone(), + std::mem::take(&mut self.keys).into(), + Box::new(self.values.clone()), + ) + .unwrap(), + ) + } + + fn as_arc(&mut self) -> std::sync::Arc { + std::sync::Arc::new( + DictionaryArray::try_new( + self.data_type.clone(), + std::mem::take(&mut self.keys).into(), + Box::new(self.values.clone()), + ) + .unwrap(), + ) + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push_null() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!(); + } +} + +/// Auxiliary struct +#[derive(Debug)] +pub struct DynMutableStructArray { + data_type: DataType, + values: Vec>, + validity: Option, +} + +impl DynMutableStructArray { + pub fn new(values: Vec>, data_type: DataType) -> Self { + Self { + data_type, + values, + validity: None, + } + } + + /// The values + pub fn mut_values(&mut self, field: usize) -> &mut dyn MutableArray { + self.values[field].as_mut() + } + + #[inline] + pub fn try_push_valid(&mut self) -> Result<()> { + if let Some(validity) = &mut self.validity { + validity.push(true) + } + Ok(()) + } + + #[inline] + fn push_null(&mut self) { + self.values.iter_mut().for_each(|x| x.push_null()); + match &mut self.validity { + Some(validity) => validity.push(false), + None => self.init_validity(), + } + } + + fn init_validity(&mut self) { + let len = self.len(); + + let mut validity = MutableBitmap::new(); + 
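+        // same lazy validity initialization as DynMutableListArray: earlier rows stay valid,
+        // the row just pushed is marked null below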
validity.extend_constant(len, true); + validity.set(len - 1, false); + self.validity = Some(validity) + } +} + +impl MutableArray for DynMutableStructArray { + fn len(&self) -> usize { + self.values[0].len() + } + + fn validity(&self) -> Option<&MutableBitmap> { + self.validity.as_ref() + } + + fn as_box(&mut self) -> Box { + let values = self.values.iter_mut().map(|x| x.as_box()).collect(); + + Box::new(StructArray::new( + self.data_type.clone(), + values, + std::mem::take(&mut self.validity).map(|x| x.into()), + )) + } + + fn as_arc(&mut self) -> std::sync::Arc { + let values = self.values.iter_mut().map(|x| x.as_box()).collect(); + + std::sync::Arc::new(StructArray::new( + self.data_type.clone(), + values, + std::mem::take(&mut self.validity).map(|x| x.into()), + )) + } + + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + #[inline] + fn push_null(&mut self) { + self.push_null() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!(); + } +} diff --git a/crates/nano-arrow/src/io/avro/read/schema.rs b/crates/nano-arrow/src/io/avro/read/schema.rs new file mode 100644 index 000000000000..ca50c59ca9fa --- /dev/null +++ b/crates/nano-arrow/src/io/avro/read/schema.rs @@ -0,0 +1,145 @@ +use avro_schema::schema::{Enum, Fixed, Record, Schema as AvroSchema}; + +use crate::datatypes::*; +use crate::error::{Error, Result}; + +fn external_props(schema: &AvroSchema) -> Metadata { + let mut props = Metadata::new(); + match &schema { + AvroSchema::Record(Record { + doc: Some(ref doc), .. + }) + | AvroSchema::Enum(Enum { + doc: Some(ref doc), .. + }) => { + props.insert("avro::doc".to_string(), doc.clone()); + }, + _ => {}, + } + props +} + +/// Infers an [`Schema`] from the root [`Record`]. +/// This +pub fn infer_schema(record: &Record) -> Result { + Ok(record + .fields + .iter() + .map(|field| { + schema_to_field( + &field.schema, + Some(&field.name), + external_props(&field.schema), + ) + }) + .collect::>>()? 
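+        // the collected `Vec<Field>` is converted into a `Schema` by its `From` impl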
+ .into()) +} + +fn schema_to_field(schema: &AvroSchema, name: Option<&str>, props: Metadata) -> Result { + let mut nullable = false; + let data_type = match schema { + AvroSchema::Null => DataType::Null, + AvroSchema::Boolean => DataType::Boolean, + AvroSchema::Int(logical) => match logical { + Some(logical) => match logical { + avro_schema::schema::IntLogical::Date => DataType::Date32, + avro_schema::schema::IntLogical::Time => DataType::Time32(TimeUnit::Millisecond), + }, + None => DataType::Int32, + }, + AvroSchema::Long(logical) => match logical { + Some(logical) => match logical { + avro_schema::schema::LongLogical::Time => DataType::Time64(TimeUnit::Microsecond), + avro_schema::schema::LongLogical::TimestampMillis => { + DataType::Timestamp(TimeUnit::Millisecond, Some("00:00".to_string())) + }, + avro_schema::schema::LongLogical::TimestampMicros => { + DataType::Timestamp(TimeUnit::Microsecond, Some("00:00".to_string())) + }, + avro_schema::schema::LongLogical::LocalTimestampMillis => { + DataType::Timestamp(TimeUnit::Millisecond, None) + }, + avro_schema::schema::LongLogical::LocalTimestampMicros => { + DataType::Timestamp(TimeUnit::Microsecond, None) + }, + }, + None => DataType::Int64, + }, + AvroSchema::Float => DataType::Float32, + AvroSchema::Double => DataType::Float64, + AvroSchema::Bytes(logical) => match logical { + Some(logical) => match logical { + avro_schema::schema::BytesLogical::Decimal(precision, scale) => { + DataType::Decimal(*precision, *scale) + }, + }, + None => DataType::Binary, + }, + AvroSchema::String(_) => DataType::Utf8, + AvroSchema::Array(item_schema) => DataType::List(Box::new(schema_to_field( + item_schema, + Some("item"), // default name for list items + Metadata::default(), + )?)), + AvroSchema::Map(_) => todo!("Avro maps are mapped to MapArrays"), + AvroSchema::Union(schemas) => { + // If there are only two variants and one of them is null, set the other type as the field data type + let has_nullable = schemas.iter().any(|x| x == &AvroSchema::Null); + if has_nullable && schemas.len() == 2 { + nullable = true; + if let Some(schema) = schemas + .iter() + .find(|&schema| !matches!(schema, AvroSchema::Null)) + { + schema_to_field(schema, None, Metadata::default())?.data_type + } else { + return Err(Error::NotYetImplemented(format!( + "Can't read avro union {schema:?}" + ))); + } + } else { + let fields = schemas + .iter() + .map(|s| schema_to_field(s, None, Metadata::default())) + .collect::>>()?; + DataType::Union(fields, None, UnionMode::Dense) + } + }, + AvroSchema::Record(Record { fields, .. }) => { + let fields = fields + .iter() + .map(|field| { + let mut props = Metadata::new(); + if let Some(doc) = &field.doc { + props.insert("avro::doc".to_string(), doc.clone()); + } + schema_to_field(&field.schema, Some(&field.name), props) + }) + .collect::>()?; + DataType::Struct(fields) + }, + AvroSchema::Enum { .. } => { + return Ok(Field::new( + name.unwrap_or_default(), + DataType::Dictionary(IntegerType::Int32, Box::new(DataType::Utf8), false), + false, + )) + }, + AvroSchema::Fixed(Fixed { size, logical, .. 
}) => match logical { + Some(logical) => match logical { + avro_schema::schema::FixedLogical::Decimal(precision, scale) => { + DataType::Decimal(*precision, *scale) + }, + avro_schema::schema::FixedLogical::Duration => { + DataType::Interval(IntervalUnit::MonthDayNano) + }, + }, + None => DataType::FixedSizeBinary(*size), + }, + }; + + let name = name.unwrap_or_default(); + + Ok(Field::new(name, data_type, nullable).with_metadata(props)) +} diff --git a/crates/nano-arrow/src/io/avro/read/util.rs b/crates/nano-arrow/src/io/avro/read/util.rs new file mode 100644 index 000000000000..a26ee0e005ee --- /dev/null +++ b/crates/nano-arrow/src/io/avro/read/util.rs @@ -0,0 +1,17 @@ +use std::io::Read; + +use super::super::avro_decode; +use crate::error::{Error, Result}; + +pub fn zigzag_i64(reader: &mut R) -> Result { + let z = decode_variable(reader)?; + Ok(if z & 0x1 == 0 { + (z >> 1) as i64 + } else { + !(z >> 1) as i64 + }) +} + +fn decode_variable(reader: &mut R) -> Result { + avro_decode!(reader) +} diff --git a/crates/nano-arrow/src/io/avro/write/mod.rs b/crates/nano-arrow/src/io/avro/write/mod.rs new file mode 100644 index 000000000000..6448782bb44e --- /dev/null +++ b/crates/nano-arrow/src/io/avro/write/mod.rs @@ -0,0 +1,28 @@ +//! APIs to write to Avro format. +use avro_schema::file::Block; + +mod schema; +pub use schema::to_record; +mod serialize; +pub use serialize::{can_serialize, new_serializer, BoxSerializer}; + +/// consumes a set of [`BoxSerializer`] into an [`Block`]. +/// # Panics +/// Panics iff the number of items in any of the serializers is not equal to the number of rows +/// declared in the `block`. +pub fn serialize(serializers: &mut [BoxSerializer], block: &mut Block) { + let Block { + data, + number_of_rows, + } = block; + + data.clear(); // restart it + + // _the_ transpose (columns -> rows) + for _ in 0..*number_of_rows { + for serializer in &mut *serializers { + let item_data = serializer.next().unwrap(); + data.extend(item_data); + } + } +} diff --git a/crates/nano-arrow/src/io/avro/write/schema.rs b/crates/nano-arrow/src/io/avro/write/schema.rs new file mode 100644 index 000000000000..b81cdc77ce3a --- /dev/null +++ b/crates/nano-arrow/src/io/avro/write/schema.rs @@ -0,0 +1,91 @@ +use avro_schema::schema::{ + BytesLogical, Field as AvroField, Fixed, FixedLogical, IntLogical, LongLogical, Record, + Schema as AvroSchema, +}; + +use crate::datatypes::*; +use crate::error::{Error, Result}; + +/// Converts a [`Schema`] to an Avro [`Record`]. +pub fn to_record(schema: &Schema) -> Result { + let mut name_counter: i32 = 0; + let fields = schema + .fields + .iter() + .map(|f| field_to_field(f, &mut name_counter)) + .collect::>()?; + Ok(Record { + name: "".to_string(), + namespace: None, + doc: None, + aliases: vec![], + fields, + }) +} + +fn field_to_field(field: &Field, name_counter: &mut i32) -> Result { + let schema = type_to_schema(field.data_type(), field.is_nullable, name_counter)?; + Ok(AvroField::new(&field.name, schema)) +} + +fn type_to_schema( + data_type: &DataType, + is_nullable: bool, + name_counter: &mut i32, +) -> Result { + Ok(if is_nullable { + AvroSchema::Union(vec![ + AvroSchema::Null, + _type_to_schema(data_type, name_counter)?, + ]) + } else { + _type_to_schema(data_type, name_counter)? 
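+        // non-nullable: map the type directly; nullable types were wrapped in [Null, T] above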
+ }) +} + +fn _get_field_name(name_counter: &mut i32) -> String { + *name_counter += 1; + format!("r{name_counter}") +} + +fn _type_to_schema(data_type: &DataType, name_counter: &mut i32) -> Result { + Ok(match data_type.to_logical_type() { + DataType::Null => AvroSchema::Null, + DataType::Boolean => AvroSchema::Boolean, + DataType::Int32 => AvroSchema::Int(None), + DataType::Int64 => AvroSchema::Long(None), + DataType::Float32 => AvroSchema::Float, + DataType::Float64 => AvroSchema::Double, + DataType::Binary => AvroSchema::Bytes(None), + DataType::LargeBinary => AvroSchema::Bytes(None), + DataType::Utf8 => AvroSchema::String(None), + DataType::LargeUtf8 => AvroSchema::String(None), + DataType::LargeList(inner) | DataType::List(inner) => AvroSchema::Array(Box::new( + type_to_schema(&inner.data_type, inner.is_nullable, name_counter)?, + )), + DataType::Struct(fields) => AvroSchema::Record(Record::new( + _get_field_name(name_counter), + fields + .iter() + .map(|f| field_to_field(f, name_counter)) + .collect::>>()?, + )), + DataType::Date32 => AvroSchema::Int(Some(IntLogical::Date)), + DataType::Time32(TimeUnit::Millisecond) => AvroSchema::Int(Some(IntLogical::Time)), + DataType::Time64(TimeUnit::Microsecond) => AvroSchema::Long(Some(LongLogical::Time)), + DataType::Timestamp(TimeUnit::Millisecond, None) => { + AvroSchema::Long(Some(LongLogical::LocalTimestampMillis)) + }, + DataType::Timestamp(TimeUnit::Microsecond, None) => { + AvroSchema::Long(Some(LongLogical::LocalTimestampMicros)) + }, + DataType::Interval(IntervalUnit::MonthDayNano) => { + let mut fixed = Fixed::new("", 12); + fixed.logical = Some(FixedLogical::Duration); + AvroSchema::Fixed(fixed) + }, + DataType::FixedSizeBinary(size) => AvroSchema::Fixed(Fixed::new("", *size)), + DataType::Decimal(p, s) => AvroSchema::Bytes(Some(BytesLogical::Decimal(*p, *s))), + other => return Err(Error::NotYetImplemented(format!("write {other:?} to avro"))), + }) +} diff --git a/crates/nano-arrow/src/io/avro/write/serialize.rs b/crates/nano-arrow/src/io/avro/write/serialize.rs new file mode 100644 index 000000000000..888861db376a --- /dev/null +++ b/crates/nano-arrow/src/io/avro/write/serialize.rs @@ -0,0 +1,535 @@ +use avro_schema::schema::{Record, Schema as AvroSchema}; +use avro_schema::write::encode; + +use super::super::super::iterator::*; +use crate::array::*; +use crate::bitmap::utils::ZipValidity; +use crate::datatypes::{DataType, IntervalUnit, PhysicalType, PrimitiveType}; +use crate::offset::Offset; +use crate::types::months_days_ns; + +// Zigzag representation of false and true respectively. +const IS_NULL: u8 = 0; +const IS_VALID: u8 = 2; + +/// A type alias for a boxed [`StreamingIterator`], used to write arrays into avro rows +/// (i.e. 
a column -> row transposition of types known at run-time) +pub type BoxSerializer<'a> = Box + 'a + Send + Sync>; + +fn utf8_required(array: &Utf8Array) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.values_iter(), + |x, buf| { + encode::zigzag_encode(x.len() as i64, buf).unwrap(); + buf.extend_from_slice(x.as_bytes()); + }, + vec![], + )) +} + +fn utf8_optional(array: &Utf8Array) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + encode::zigzag_encode(x.len() as i64, buf).unwrap(); + buf.extend_from_slice(x.as_bytes()); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) +} + +fn binary_required(array: &BinaryArray) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.values_iter(), + |x, buf| { + encode::zigzag_encode(x.len() as i64, buf).unwrap(); + buf.extend_from_slice(x); + }, + vec![], + )) +} + +fn binary_optional(array: &BinaryArray) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + encode::zigzag_encode(x.len() as i64, buf).unwrap(); + buf.extend_from_slice(x); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) +} + +fn fixed_size_binary_required(array: &FixedSizeBinaryArray) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.values_iter(), + |x, buf| { + buf.extend_from_slice(x); + }, + vec![], + )) +} + +fn fixed_size_binary_optional(array: &FixedSizeBinaryArray) -> BoxSerializer { + Box::new(BufStreamingIterator::new( + array.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + buf.extend_from_slice(x); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) +} + +fn list_required<'a, O: Offset>(array: &'a ListArray, schema: &AvroSchema) -> BoxSerializer<'a> { + let mut inner = new_serializer(array.values().as_ref(), schema); + let lengths = array + .offsets() + .buffer() + .windows(2) + .map(|w| (w[1] - w[0]).to_usize() as i64); + + Box::new(BufStreamingIterator::new( + lengths, + move |length, buf| { + encode::zigzag_encode(length, buf).unwrap(); + let mut rows = 0; + while let Some(item) = inner.next() { + buf.extend_from_slice(item); + rows += 1; + if rows == length { + encode::zigzag_encode(0, buf).unwrap(); + break; + } + } + }, + vec![], + )) +} + +fn list_optional<'a, O: Offset>(array: &'a ListArray, schema: &AvroSchema) -> BoxSerializer<'a> { + let mut inner = new_serializer(array.values().as_ref(), schema); + let lengths = array + .offsets() + .buffer() + .windows(2) + .map(|w| (w[1] - w[0]).to_usize() as i64); + let lengths = ZipValidity::new_with_validity(lengths, array.validity()); + + Box::new(BufStreamingIterator::new( + lengths, + move |length, buf| { + if let Some(length) = length { + buf.push(IS_VALID); + encode::zigzag_encode(length, buf).unwrap(); + let mut rows = 0; + while let Some(item) = inner.next() { + buf.extend_from_slice(item); + rows += 1; + if rows == length { + encode::zigzag_encode(0, buf).unwrap(); + break; + } + } + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) +} + +fn struct_required<'a>(array: &'a StructArray, schema: &Record) -> BoxSerializer<'a> { + let schemas = schema.fields.iter().map(|x| &x.schema); + let mut inner = array + .values() + .iter() + .zip(schemas) + .map(|(x, schema)| new_serializer(x.as_ref(), schema)) + .collect::>(); + + Box::new(BufStreamingIterator::new( + 0..array.len(), + move |_, buf| { + inner + .iter_mut() + .for_each(|item| buf.extend_from_slice(item.next().unwrap())) + }, + 
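+        // scratch buffer, cleared and refilled for every row by the streaming iterator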
vec![], + )) +} + +fn struct_optional<'a>(array: &'a StructArray, schema: &Record) -> BoxSerializer<'a> { + let schemas = schema.fields.iter().map(|x| &x.schema); + let mut inner = array + .values() + .iter() + .zip(schemas) + .map(|(x, schema)| new_serializer(x.as_ref(), schema)) + .collect::>(); + + let iterator = ZipValidity::new_with_validity(0..array.len(), array.validity()); + + Box::new(BufStreamingIterator::new( + iterator, + move |maybe, buf| { + if maybe.is_some() { + buf.push(IS_VALID); + inner + .iter_mut() + .for_each(|item| buf.extend_from_slice(item.next().unwrap())) + } else { + buf.push(IS_NULL); + // skip the item + inner.iter_mut().for_each(|item| { + let _ = item.next().unwrap(); + }); + } + }, + vec![], + )) +} + +/// Creates a [`StreamingIterator`] trait object that presents items from `array` +/// encoded according to `schema`. +/// # Panic +/// This function panics iff the `data_type` is not supported (use [`can_serialize`] to check) +/// # Implementation +/// This function performs minimal CPU work: it dynamically dispatches based on the schema +/// and arrow type. +pub fn new_serializer<'a>(array: &'a dyn Array, schema: &AvroSchema) -> BoxSerializer<'a> { + let data_type = array.data_type().to_physical_type(); + + match (data_type, schema) { + (PhysicalType::Boolean, AvroSchema::Boolean) => { + let values = array.as_any().downcast_ref::().unwrap(); + Box::new(BufStreamingIterator::new( + values.values_iter(), + |x, buf| { + buf.push(x as u8); + }, + vec![], + )) + }, + (PhysicalType::Boolean, AvroSchema::Union(_)) => { + let values = array.as_any().downcast_ref::().unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.extend_from_slice(&[IS_VALID, x as u8]); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Utf8, AvroSchema::Union(_)) => { + utf8_optional::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::LargeUtf8, AvroSchema::Union(_)) => { + utf8_optional::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::Utf8, AvroSchema::String(_)) => { + utf8_required::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::LargeUtf8, AvroSchema::String(_)) => { + utf8_required::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::Binary, AvroSchema::Union(_)) => { + binary_optional::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::LargeBinary, AvroSchema::Union(_)) => { + binary_optional::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::FixedSizeBinary, AvroSchema::Union(_)) => { + fixed_size_binary_optional(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::Binary, AvroSchema::Bytes(_)) => { + binary_required::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::LargeBinary, AvroSchema::Bytes(_)) => { + binary_required::(array.as_any().downcast_ref().unwrap()) + }, + (PhysicalType::FixedSizeBinary, AvroSchema::Fixed(_)) => { + fixed_size_binary_required(array.as_any().downcast_ref().unwrap()) + }, + + (PhysicalType::Primitive(PrimitiveType::Int32), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + encode::zigzag_encode(*x as i64, buf).unwrap(); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Int32), AvroSchema::Int(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + 
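+            // non-nullable ints: each value is zigzag-encoded as an Avro long, with no
+            // leading union tag byte (contrast with the `Union` arm above)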
Box::new(BufStreamingIterator::new( + values.values().iter(), + |x, buf| { + encode::zigzag_encode(*x as i64, buf).unwrap(); + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Int64), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + encode::zigzag_encode(*x, buf).unwrap(); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Int64), AvroSchema::Long(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.values().iter(), + |x, buf| { + encode::zigzag_encode(*x, buf).unwrap(); + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Float32), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + buf.extend(x.to_le_bytes()) + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Float32), AvroSchema::Float) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.values().iter(), + |x, buf| { + buf.extend_from_slice(&x.to_le_bytes()); + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Float64), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + buf.extend(x.to_le_bytes()) + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Float64), AvroSchema::Double) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.values().iter(), + |x, buf| { + buf.extend_from_slice(&x.to_le_bytes()); + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Int128), AvroSchema::Bytes(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.values().iter(), + |x, buf| { + let len = ((x.leading_zeros() / 8) - ((x.leading_zeros() / 8) % 2)) as usize; + encode::zigzag_encode((16 - len) as i64, buf).unwrap(); + buf.extend_from_slice(&x.to_be_bytes()[len..]); + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::Int128), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + let len = + ((x.leading_zeros() / 8) - ((x.leading_zeros() / 8) % 2)) as usize; + encode::zigzag_encode((16 - len) as i64, buf).unwrap(); + buf.extend_from_slice(&x.to_be_bytes()[len..]); + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::MonthDayNano), AvroSchema::Fixed(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.values().iter(), + interval_write, + vec![], + )) + }, + (PhysicalType::Primitive(PrimitiveType::MonthDayNano), AvroSchema::Union(_)) => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap(); + Box::new(BufStreamingIterator::new( + values.iter(), + |x, buf| { + if let Some(x) = x { + buf.push(IS_VALID); + 
interval_write(x, buf) + } else { + buf.push(IS_NULL); + } + }, + vec![], + )) + }, + + (PhysicalType::List, AvroSchema::Array(schema)) => { + list_required::(array.as_any().downcast_ref().unwrap(), schema.as_ref()) + }, + (PhysicalType::LargeList, AvroSchema::Array(schema)) => { + list_required::(array.as_any().downcast_ref().unwrap(), schema.as_ref()) + }, + (PhysicalType::List, AvroSchema::Union(inner)) => { + let schema = if let AvroSchema::Array(schema) = &inner[1] { + schema.as_ref() + } else { + unreachable!("The schema declaration does not match the deserialization") + }; + list_optional::(array.as_any().downcast_ref().unwrap(), schema) + }, + (PhysicalType::LargeList, AvroSchema::Union(inner)) => { + let schema = if let AvroSchema::Array(schema) = &inner[1] { + schema.as_ref() + } else { + unreachable!("The schema declaration does not match the deserialization") + }; + list_optional::(array.as_any().downcast_ref().unwrap(), schema) + }, + (PhysicalType::Struct, AvroSchema::Record(inner)) => { + struct_required(array.as_any().downcast_ref().unwrap(), inner) + }, + (PhysicalType::Struct, AvroSchema::Union(inner)) => { + let inner = if let AvroSchema::Record(inner) = &inner[1] { + inner + } else { + unreachable!("The schema declaration does not match the deserialization") + }; + struct_optional(array.as_any().downcast_ref().unwrap(), inner) + }, + (a, b) => todo!("{:?} -> {:?} not supported", a, b), + } +} + +/// Whether [`new_serializer`] supports `data_type`. +pub fn can_serialize(data_type: &DataType) -> bool { + use DataType::*; + match data_type.to_logical_type() { + List(inner) => return can_serialize(&inner.data_type), + LargeList(inner) => return can_serialize(&inner.data_type), + Struct(inner) => return inner.iter().all(|inner| can_serialize(&inner.data_type)), + _ => {}, + }; + + matches!( + data_type, + Boolean + | Int32 + | Int64 + | Float32 + | Float64 + | Decimal(_, _) + | Utf8 + | Binary + | FixedSizeBinary(_) + | LargeUtf8 + | LargeBinary + | Interval(IntervalUnit::MonthDayNano) + ) +} + +#[inline] +fn interval_write(x: &months_days_ns, buf: &mut Vec) { + // https://avro.apache.org/docs/current/spec.html#Duration + // 12 bytes, months, days, millis in LE + buf.reserve(12); + buf.extend(x.months().to_le_bytes()); + buf.extend(x.days().to_le_bytes()); + buf.extend(((x.ns() / 1_000_000) as i32).to_le_bytes()); +} diff --git a/crates/nano-arrow/src/io/flight/mod.rs b/crates/nano-arrow/src/io/flight/mod.rs new file mode 100644 index 000000000000..0cce1774568f --- /dev/null +++ b/crates/nano-arrow/src/io/flight/mod.rs @@ -0,0 +1,243 @@ +//! Serialization and deserialization to Arrow's flight protocol + +use arrow_format::flight::data::{FlightData, SchemaResult}; +use arrow_format::ipc; +use arrow_format::ipc::planus::ReadAsRoot; + +use super::ipc::read::Dictionaries; +pub use super::ipc::write::default_ipc_fields; +use super::ipc::{IpcField, IpcSchema}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::*; +use crate::error::{Error, Result}; +pub use crate::io::ipc::write::common::WriteOptions; +use crate::io::ipc::write::common::{encode_chunk, DictionaryTracker, EncodedData}; +use crate::io::ipc::{read, write}; + +/// Serializes [`Chunk`] to a vector of [`FlightData`] representing the serialized dictionaries +/// and a [`FlightData`] representing the batch. 
+/// # Errors +/// This function errors iff `fields` is not consistent with `columns` +pub fn serialize_batch( + chunk: &Chunk>, + fields: &[IpcField], + options: &WriteOptions, +) -> Result<(Vec, FlightData)> { + if fields.len() != chunk.arrays().len() { + return Err(Error::InvalidArgumentError("The argument `fields` must be consistent with the columns' schema. Use e.g. &arrow2::io::flight::default_ipc_fields(&schema.fields)".to_string())); + } + + let mut dictionary_tracker = DictionaryTracker { + dictionaries: Default::default(), + cannot_replace: false, + }; + + let (encoded_dictionaries, encoded_batch) = + encode_chunk(chunk, fields, &mut dictionary_tracker, options) + .expect("DictionaryTracker configured above to not error on replacement"); + + let flight_dictionaries = encoded_dictionaries.into_iter().map(Into::into).collect(); + let flight_batch = encoded_batch.into(); + + Ok((flight_dictionaries, flight_batch)) +} + +impl From for FlightData { + fn from(data: EncodedData) -> Self { + FlightData { + data_header: data.ipc_message, + data_body: data.arrow_data, + ..Default::default() + } + } +} + +/// Serializes a [`Schema`] to [`SchemaResult`]. +pub fn serialize_schema_to_result( + schema: &Schema, + ipc_fields: Option<&[IpcField]>, +) -> SchemaResult { + SchemaResult { + schema: _serialize_schema(schema, ipc_fields), + } +} + +/// Serializes a [`Schema`] to [`FlightData`]. +pub fn serialize_schema(schema: &Schema, ipc_fields: Option<&[IpcField]>) -> FlightData { + FlightData { + data_header: _serialize_schema(schema, ipc_fields), + ..Default::default() + } +} + +/// Convert a [`Schema`] to bytes in the format expected in [`arrow_format::flight::data::FlightInfo`]. +pub fn serialize_schema_to_info( + schema: &Schema, + ipc_fields: Option<&[IpcField]>, +) -> Result> { + let encoded_data = if let Some(ipc_fields) = ipc_fields { + schema_as_encoded_data(schema, ipc_fields) + } else { + let ipc_fields = default_ipc_fields(&schema.fields); + schema_as_encoded_data(schema, &ipc_fields) + }; + + let mut schema = vec![]; + write::common_sync::write_message(&mut schema, &encoded_data)?; + Ok(schema) +} + +fn _serialize_schema(schema: &Schema, ipc_fields: Option<&[IpcField]>) -> Vec { + if let Some(ipc_fields) = ipc_fields { + write::schema_to_bytes(schema, ipc_fields) + } else { + let ipc_fields = default_ipc_fields(&schema.fields); + write::schema_to_bytes(schema, &ipc_fields) + } +} + +fn schema_as_encoded_data(schema: &Schema, ipc_fields: &[IpcField]) -> EncodedData { + EncodedData { + ipc_message: write::schema_to_bytes(schema, ipc_fields), + arrow_data: vec![], + } +} + +/// Deserialize an IPC message into [`Schema`], [`IpcSchema`]. +/// Use to deserialize [`FlightData::data_header`] and [`SchemaResult::schema`]. +pub fn deserialize_schemas(bytes: &[u8]) -> Result<(Schema, IpcSchema)> { + read::deserialize_schema(bytes) +} + +/// Deserializes [`FlightData`] representing a record batch message to [`Chunk`]. 
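+// A minimal read-side sketch (illustrative only; `schema_message` and `flight_data_stream`
+// are hypothetical placeholders for whatever transport delivers the FlightData):
+//
+//     let (schema, ipc_schema) = deserialize_schemas(&schema_message.data_header)?;
+//     let mut dictionaries = Dictionaries::default();
+//     for data in flight_data_stream {
+//         // dictionary messages update `dictionaries`; record batch messages yield a chunk
+//         if let Some(chunk) =
+//             deserialize_message(&data, &schema.fields, &ipc_schema, &mut dictionaries)?
+//         {
+//             // use `chunk`
+//         }
+//     }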
+pub fn deserialize_batch( + data: &FlightData, + fields: &[Field], + ipc_schema: &IpcSchema, + dictionaries: &read::Dictionaries, +) -> Result>> { + // check that the data_header is a record batch message + let message = arrow_format::ipc::MessageRef::read_as_root(&data.data_header) + .map_err(|err| Error::OutOfSpec(format!("Unable to get root as message: {err:?}")))?; + + let length = data.data_body.len(); + let mut reader = std::io::Cursor::new(&data.data_body); + + match message.header()?.ok_or_else(|| { + Error::oos("Unable to convert flight data header to a record batch".to_string()) + })? { + ipc::MessageHeaderRef::RecordBatch(batch) => read::read_record_batch( + batch, + fields, + ipc_schema, + None, + None, + dictionaries, + message.version()?, + &mut reader, + 0, + length as u64, + &mut Default::default(), + ), + _ => Err(Error::nyi( + "flight currently only supports reading RecordBatch messages", + )), + } +} + +/// Deserializes [`FlightData`], assuming it to be a dictionary message, into `dictionaries`. +pub fn deserialize_dictionary( + data: &FlightData, + fields: &[Field], + ipc_schema: &IpcSchema, + dictionaries: &mut read::Dictionaries, +) -> Result<()> { + let message = ipc::MessageRef::read_as_root(&data.data_header)?; + + let chunk = if let ipc::MessageHeaderRef::DictionaryBatch(chunk) = message + .header()? + .ok_or_else(|| Error::oos("Header is required"))? + { + chunk + } else { + return Ok(()); + }; + + let length = data.data_body.len(); + let mut reader = std::io::Cursor::new(&data.data_body); + read::read_dictionary( + chunk, + fields, + ipc_schema, + dictionaries, + &mut reader, + 0, + length as u64, + &mut Default::default(), + )?; + + Ok(()) +} + +/// Deserializes [`FlightData`] into either a [`Chunk`] (when the message is a record batch) +/// or by upserting into `dictionaries` (when the message is a dictionary) +pub fn deserialize_message( + data: &FlightData, + fields: &[Field], + ipc_schema: &IpcSchema, + dictionaries: &mut Dictionaries, +) -> Result>>> { + let FlightData { + data_header, + data_body, + .. + } = data; + + let message = arrow_format::ipc::MessageRef::read_as_root(data_header)?; + let header = message + .header()? + .ok_or_else(|| Error::oos("IPC Message must contain a header"))?; + + match header { + ipc::MessageHeaderRef::RecordBatch(batch) => { + let length = data_body.len(); + let mut reader = std::io::Cursor::new(data_body); + + let chunk = read::read_record_batch( + batch, + fields, + ipc_schema, + None, + None, + dictionaries, + arrow_format::ipc::MetadataVersion::V5, + &mut reader, + 0, + length as u64, + &mut Default::default(), + )?; + + Ok(chunk.into()) + }, + ipc::MessageHeaderRef::DictionaryBatch(dict_batch) => { + let length = data_body.len(); + let mut reader = std::io::Cursor::new(data_body); + + read::read_dictionary( + dict_batch, + fields, + ipc_schema, + dictionaries, + &mut reader, + 0, + length as u64, + &mut Default::default(), + )?; + Ok(None) + }, + t => Err(Error::nyi(format!( + "Reading types other than record batches not yet supported, unable to read {t:?}" + ))), + } +} diff --git a/crates/nano-arrow/src/io/ipc/append/mod.rs b/crates/nano-arrow/src/io/ipc/append/mod.rs new file mode 100644 index 000000000000..1acb39a931ef --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/append/mod.rs @@ -0,0 +1,72 @@ +//! 
A struct adapter of Read+Seek+Write to append to IPC files +// read header and convert to writer information +// seek to first byte of header - 1 +// write new batch +// write new footer +use std::io::{Read, Seek, SeekFrom, Write}; + +use super::endianness::is_native_little_endian; +use super::read::{self, FileMetadata}; +use super::write::common::DictionaryTracker; +use super::write::writer::*; +use super::write::*; +use crate::error::{Error, Result}; + +impl FileWriter { + /// Creates a new [`FileWriter`] from an existing file, seeking to the last message + /// and appending new messages afterwards. Users call `finish` to write the footer (with both) + /// the existing and appended messages on it. + /// # Error + /// This function errors iff: + /// * the file's endianness is not the native endianness (not yet supported) + /// * the file is not a valid Arrow IPC file + pub fn try_from_file( + mut writer: R, + metadata: FileMetadata, + options: WriteOptions, + ) -> Result> { + if metadata.ipc_schema.is_little_endian != is_native_little_endian() { + return Err(Error::nyi( + "Appending to a file of a non-native endianness is still not supported", + )); + } + + let dictionaries = + read::read_file_dictionaries(&mut writer, &metadata, &mut Default::default())?; + + let last_block = metadata.blocks.last().ok_or_else(|| { + Error::oos("An Arrow IPC file must have at least 1 message (the schema message)") + })?; + let offset: u64 = last_block + .offset + .try_into() + .map_err(|_| Error::oos("The block's offset must be a positive number"))?; + let meta_data_length: u64 = last_block + .meta_data_length + .try_into() + .map_err(|_| Error::oos("The block's meta length must be a positive number"))?; + let body_length: u64 = last_block + .body_length + .try_into() + .map_err(|_| Error::oos("The block's body length must be a positive number"))?; + let offset: u64 = offset + meta_data_length + body_length; + + writer.seek(SeekFrom::Start(offset))?; + + Ok(FileWriter { + writer, + options, + schema: metadata.schema, + ipc_fields: metadata.ipc_schema.fields, + block_offsets: offset as usize, + dictionary_blocks: metadata.dictionaries.unwrap_or_default(), + record_blocks: metadata.blocks, + state: State::Started, // file already exists, so we are ready + dictionary_tracker: DictionaryTracker { + dictionaries, + cannot_replace: true, + }, + encoded_message: Default::default(), + }) + } +} diff --git a/crates/nano-arrow/src/io/ipc/compression.rs b/crates/nano-arrow/src/io/ipc/compression.rs new file mode 100644 index 000000000000..9a69deb8248a --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/compression.rs @@ -0,0 +1,91 @@ +use crate::error::Result; + +#[cfg(feature = "io_ipc_compression")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_compression")))] +pub fn decompress_lz4(input_buf: &[u8], output_buf: &mut [u8]) -> Result<()> { + use std::io::Read; + let mut decoder = lz4::Decoder::new(input_buf)?; + decoder.read_exact(output_buf).map_err(|e| e.into()) +} + +#[cfg(feature = "io_ipc_compression")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_compression")))] +pub fn decompress_zstd(input_buf: &[u8], output_buf: &mut [u8]) -> Result<()> { + use std::io::Read; + let mut decoder = zstd::Decoder::new(input_buf)?; + decoder.read_exact(output_buf).map_err(|e| e.into()) +} + +#[cfg(not(feature = "io_ipc_compression"))] +pub fn decompress_lz4(_input_buf: &[u8], _output_buf: &mut [u8]) -> Result<()> { + use crate::error::Error; + Err(Error::OutOfSpec("The crate was compiled without IPC compression. 
Use `io_ipc_compression` to read compressed IPC.".to_string())) +} + +#[cfg(not(feature = "io_ipc_compression"))] +pub fn decompress_zstd(_input_buf: &[u8], _output_buf: &mut [u8]) -> Result<()> { + use crate::error::Error; + Err(Error::OutOfSpec("The crate was compiled without IPC compression. Use `io_ipc_compression` to read compressed IPC.".to_string())) +} + +#[cfg(feature = "io_ipc_compression")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_compression")))] +pub fn compress_lz4(input_buf: &[u8], output_buf: &mut Vec) -> Result<()> { + use std::io::Write; + + use crate::error::Error; + let mut encoder = lz4::EncoderBuilder::new() + .build(output_buf) + .map_err(Error::from)?; + encoder.write_all(input_buf)?; + encoder.finish().1.map_err(|e| e.into()) +} + +#[cfg(feature = "io_ipc_compression")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_compression")))] +pub fn compress_zstd(input_buf: &[u8], output_buf: &mut Vec) -> Result<()> { + zstd::stream::copy_encode(input_buf, output_buf, 0).map_err(|e| e.into()) +} + +#[cfg(not(feature = "io_ipc_compression"))] +pub fn compress_lz4(_input_buf: &[u8], _output_buf: &[u8]) -> Result<()> { + use crate::error::Error; + Err(Error::OutOfSpec("The crate was compiled without IPC compression. Use `io_ipc_compression` to write compressed IPC.".to_string())) +} + +#[cfg(not(feature = "io_ipc_compression"))] +pub fn compress_zstd(_input_buf: &[u8], _output_buf: &[u8]) -> Result<()> { + use crate::error::Error; + Err(Error::OutOfSpec("The crate was compiled without IPC compression. Use `io_ipc_compression` to write compressed IPC.".to_string())) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[cfg(feature = "io_ipc_compression")] + #[test] + #[cfg_attr(miri, ignore)] // ZSTD uses foreign calls that miri does not support + fn round_trip_zstd() { + let data: Vec = (0..200u8).map(|x| x % 10).collect(); + let mut buffer = vec![]; + compress_zstd(&data, &mut buffer).unwrap(); + + let mut result = vec![0; 200]; + decompress_zstd(&buffer, &mut result).unwrap(); + assert_eq!(data, result); + } + + #[cfg(feature = "io_ipc_compression")] + #[test] + #[cfg_attr(miri, ignore)] // LZ4 uses foreign calls that miri does not support + fn round_trip_lz4() { + let data: Vec = (0..200u8).map(|x| x % 10).collect(); + let mut buffer = vec![]; + compress_lz4(&data, &mut buffer).unwrap(); + + let mut result = vec![0; 200]; + decompress_lz4(&buffer, &mut result).unwrap(); + assert_eq!(data, result); + } +} diff --git a/crates/nano-arrow/src/io/ipc/endianness.rs b/crates/nano-arrow/src/io/ipc/endianness.rs new file mode 100644 index 000000000000..61b3f9b7c51c --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/endianness.rs @@ -0,0 +1,11 @@ +#[cfg(target_endian = "little")] +#[inline] +pub fn is_native_little_endian() -> bool { + true +} + +#[cfg(target_endian = "big")] +#[inline] +pub fn is_native_little_endian() -> bool { + false +} diff --git a/crates/nano-arrow/src/io/ipc/mod.rs b/crates/nano-arrow/src/io/ipc/mod.rs new file mode 100644 index 000000000000..7da03e5c0abb --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/mod.rs @@ -0,0 +1,104 @@ +//! APIs to read from and write to Arrow's IPC format. +//! +//! Inter-process communication is a method through which different processes +//! share and pass data between them. Its use-cases include parallel +//! processing of chunks of data across different CPU cores, transferring +//! data between different Apache Arrow implementations in other languages and +//! more. 
Under the hood Apache Arrow uses [FlatBuffers](https://google.github.io/flatbuffers/)
+//! as its binary protocol, so every Arrow-centered streaming or serialization
+//! problem that could be solved using FlatBuffers could probably be solved
+//! using the more integrated approach that is exposed in this module.
+//!
+//! [Arrow's IPC protocol](https://arrow.apache.org/docs/format/Columnar.html#serialization-and-interprocess-communication-ipc)
+//! allows only batch or dictionary columns to be passed
+//! around due to its reliance on a pre-defined data scheme. This constraint
+//! provides a large performance gain because serialized data will always have a
+//! known structure, i.e. the same fields and datatypes, with the only variance
+//! being the number of rows and the actual data inside the Batch. This dramatically
+//! increases the deserialization rate, as the bytes in the file or stream are already
+//! structured "correctly".
+//!
+//! Reading and writing IPC messages is done using one of two variants - either
+//! [`FileReader`](read::FileReader) <-> [`FileWriter`](struct@write::FileWriter) or
+//! [`StreamReader`](read::StreamReader) <-> [`StreamWriter`](struct@write::StreamWriter).
+//! These two variants wrap a type `T` that implements [`Read`](std::io::Read), and in
+//! the case of the `File` variant it also implements [`Seek`](std::io::Seek). In
+//! practice it means that `File`s can be arbitrarily accessed while `Stream`s are only
+//! read in a certain order - the one they were written in (first in, first out).
+//!
+//! # Examples
+//! Read and write to a file:
+//! ```
+//! use arrow2::io::ipc::{{read::{FileReader, read_file_metadata}}, {write::{FileWriter, WriteOptions}}};
+//! # use std::fs::File;
+//! # use arrow2::datatypes::{Field, Schema, DataType};
+//! # use arrow2::array::{Int32Array, Array};
+//! # use arrow2::chunk::Chunk;
+//! # use arrow2::error::Error;
+//! // Setup the writer
+//! let path = "example.arrow".to_string();
+//! let mut file = File::create(&path)?;
+//! let x_coord = Field::new("x", DataType::Int32, false);
+//! let y_coord = Field::new("y", DataType::Int32, false);
+//! let schema = Schema::from(vec![x_coord, y_coord]);
+//! let options = WriteOptions {compression: None};
+//! let mut writer = FileWriter::try_new(file, schema, None, options)?;
+//!
+//! // Setup the data
+//! let x_data = Int32Array::from_slice([-1i32, 1]);
+//! let y_data = Int32Array::from_slice([1i32, -1]);
+//! let chunk = Chunk::try_new(vec![x_data.boxed(), y_data.boxed()])?;
+//!
+//! // Write the messages and finalize the stream
+//! for _ in 0..5 {
+//!     writer.write(&chunk, None)?;
+//! }
+//! writer.finish()?;
+//!
+//! // Fetch some of the data and get the reader back
+//! let mut reader = File::open(&path)?;
+//! let metadata = read_file_metadata(&mut reader)?;
+//! let mut reader = FileReader::new(reader, metadata, None, None);
+//! let row1 = reader.next().unwrap(); // [[-1, 1], [1, -1]]
+//! let row2 = reader.next().unwrap(); // [[-1, 1], [1, -1]]
+//! let mut reader = reader.into_inner();
+//! // Do more stuff with the reader, like seeking ahead.
+//! # Ok::<(), Error>(())
+//! ```
+//!
+//! For further information and examples please consult the
+//! [user guide](https://jorgecarleitao.github.io/arrow2/io/index.html).
+//! For even more examples check the `examples` folder in the main repository
+//! ([1](https://github.com/jorgecarleitao/arrow2/blob/main/examples/ipc_file_read.rs),
+//!
[2](https://github.com/jorgecarleitao/arrow2/blob/main/examples/ipc_file_write.rs), +//! [3](https://github.com/jorgecarleitao/arrow2/tree/main/examples/ipc_pyarrow)). + +mod compression; +mod endianness; + +pub mod append; +pub mod read; +pub mod write; + +const ARROW_MAGIC_V1: [u8; 4] = [b'F', b'E', b'A', b'1']; +const ARROW_MAGIC_V2: [u8; 6] = [b'A', b'R', b'R', b'O', b'W', b'1']; +pub(crate) const CONTINUATION_MARKER: [u8; 4] = [0xff; 4]; + +/// Struct containing `dictionary_id` and nested `IpcField`, allowing users +/// to specify the dictionary ids of the IPC fields when writing to IPC. +#[derive(Debug, Clone, PartialEq, Default)] +pub struct IpcField { + /// optional children + pub fields: Vec, + /// dictionary id + pub dictionary_id: Option, +} + +/// Struct containing fields and whether the file is written in little or big endian. +#[derive(Debug, Clone, PartialEq)] +pub struct IpcSchema { + /// The fields in the schema + pub fields: Vec, + /// Endianness of the file + pub is_little_endian: bool, +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/binary.rs b/crates/nano-arrow/src/io/ipc/read/array/binary.rs new file mode 100644 index 000000000000..52a5c4b7b7b0 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/binary.rs @@ -0,0 +1,91 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::read_basic::*; +use super::super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::array::BinaryArray; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::Offset; + +#[allow(clippy::too_many_arguments)] +pub fn read_binary( + field_nodes: &mut VecDeque, + data_type: DataType, + buffers: &mut VecDeque, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result> { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let offsets: Buffer = read_buffer( + buffers, + 1 + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + ) + // Older versions of the IPC format sometimes do not report an offset + .or_else(|_| Result::Ok(Buffer::::from(vec![O::default()])))?; + + let last_offset = offsets.last().unwrap().to_usize(); + let values = read_buffer( + buffers, + last_offset, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + + BinaryArray::::try_new(data_type, offsets.try_into()?, values, validity) +} + +pub fn skip_binary( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for binary. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing offsets buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing values buffer."))?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/boolean.rs b/crates/nano-arrow/src/io/ipc/read/array/boolean.rs new file mode 100644 index 000000000000..6d78c184b168 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/boolean.rs @@ -0,0 +1,72 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::read_basic::*; +use super::super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::array::BooleanArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_boolean( + field_nodes: &mut VecDeque, + data_type: DataType, + buffers: &mut VecDeque, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let values = read_bitmap( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + BooleanArray::try_new(data_type, values, validity) +} + +pub fn skip_boolean( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for boolean. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing values buffer."))?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/dictionary.rs b/crates/nano-arrow/src/io/ipc/read/array/dictionary.rs new file mode 100644 index 000000000000..554e6d32dcbf --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/dictionary.rs @@ -0,0 +1,65 @@ +use std::collections::VecDeque; +use std::convert::TryInto; +use std::io::{Read, Seek}; + +use ahash::HashSet; + +use super::super::{Compression, Dictionaries, IpcBuffer, Node}; +use super::{read_primitive, skip_primitive}; +use crate::array::{DictionaryArray, DictionaryKey}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_dictionary( + field_nodes: &mut VecDeque, + data_type: DataType, + id: Option, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + compression: Option, + limit: Option, + is_little_endian: bool, + scratch: &mut Vec, +) -> Result> +where + Vec: TryInto, +{ + let id = if let Some(id) = id { + id + } else { + return Err(Error::OutOfSpec("Dictionary has no id.".to_string())); + }; + let values = dictionaries + .get(&id) + .ok_or_else(|| { + let valid_ids = dictionaries.keys().collect::>(); + Error::OutOfSpec(format!( + "Dictionary id {id} not found. Valid ids: {valid_ids:?}" + )) + })? + .clone(); + + let keys = read_primitive( + field_nodes, + T::PRIMITIVE.into(), + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + DictionaryArray::::try_new(data_type, keys, values) +} + +pub fn skip_dictionary( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + skip_primitive(field_nodes, buffers) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/fixed_size_binary.rs b/crates/nano-arrow/src/io/ipc/read/array/fixed_size_binary.rs new file mode 100644 index 000000000000..ed0d0049ffb2 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/fixed_size_binary.rs @@ -0,0 +1,76 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::read_basic::*; +use super::super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::array::FixedSizeBinaryArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_fixed_size_binary( + field_nodes: &mut VecDeque, + data_type: DataType, + buffers: &mut VecDeque, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." 
+ )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let length = length.saturating_mul(FixedSizeBinaryArray::maybe_get_size(&data_type)?); + let values = read_buffer( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + + FixedSizeBinaryArray::try_new(data_type, values, validity) +} + +pub fn skip_fixed_size_binary( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos( + "IPC: unable to fetch the field for fixed-size binary. The file or stream is corrupted.", + ) + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing values buffer."))?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/fixed_size_list.rs b/crates/nano-arrow/src/io/ipc/read/array/fixed_size_list.rs new file mode 100644 index 000000000000..5553c1f478ff --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/fixed_size_list.rs @@ -0,0 +1,83 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::super::IpcField; +use super::super::deserialize::{read, skip}; +use super::super::read_basic::*; +use super::super::{Compression, Dictionaries, IpcBuffer, Node, Version}; +use crate::array::FixedSizeListArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_fixed_size_list( + field_nodes: &mut VecDeque, + data_type: DataType, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: Version, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let (field, size) = FixedSizeListArray::get_child_and_size(&data_type); + + let limit = limit.map(|x| x.saturating_mul(size)); + + let values = read( + field_nodes, + field, + &ipc_field.fields[0], + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + )?; + FixedSizeListArray::try_new(data_type, values, validity) +} + +pub fn skip_fixed_size_list( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos( + "IPC: unable to fetch the field for fixed-size list. 
The file or stream is corrupted.", + ) + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + + let (field, _) = FixedSizeListArray::get_child_and_size(data_type); + + skip(field_nodes, field.data_type(), buffers) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/list.rs b/crates/nano-arrow/src/io/ipc/read/array/list.rs new file mode 100644 index 000000000000..83809cf995c1 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/list.rs @@ -0,0 +1,108 @@ +use std::collections::VecDeque; +use std::convert::TryInto; +use std::io::{Read, Seek}; + +use super::super::super::IpcField; +use super::super::deserialize::{read, skip}; +use super::super::read_basic::*; +use super::super::{Compression, Dictionaries, IpcBuffer, Node, OutOfSpecKind, Version}; +use crate::array::ListArray; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::Offset; + +#[allow(clippy::too_many_arguments)] +pub fn read_list( + field_nodes: &mut VecDeque, + data_type: DataType, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: Version, + scratch: &mut Vec, +) -> Result> +where + Vec: TryInto, +{ + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let offsets = read_buffer::( + buffers, + 1 + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + ) + // Older versions of the IPC format sometimes do not report an offset + .or_else(|_| Result::Ok(Buffer::::from(vec![O::default()])))?; + + let last_offset = offsets.last().unwrap().to_usize(); + + let field = ListArray::::get_child_field(&data_type); + + let values = read( + field_nodes, + field, + &ipc_field.fields[0], + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + Some(last_offset), + version, + scratch, + )?; + ListArray::try_new(data_type, offsets.try_into()?, values, validity) +} + +pub fn skip_list( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for list. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing offsets buffer."))?; + + let data_type = ListArray::::get_child_type(data_type); + + skip(field_nodes, data_type, buffers) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/map.rs b/crates/nano-arrow/src/io/ipc/read/array/map.rs new file mode 100644 index 000000000000..cf383407a8c0 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/map.rs @@ -0,0 +1,103 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::super::IpcField; +use super::super::deserialize::{read, skip}; +use super::super::read_basic::*; +use super::super::{Compression, Dictionaries, IpcBuffer, Node, OutOfSpecKind, Version}; +use crate::array::MapArray; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_map( + field_nodes: &mut VecDeque, + data_type: DataType, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: Version, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let offsets = read_buffer::( + buffers, + 1 + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + ) + // Older versions of the IPC format sometimes do not report an offset + .or_else(|_| Result::Ok(Buffer::::from(vec![0i32])))?; + + let field = MapArray::get_field(&data_type); + + let last_offset: usize = offsets.last().copied().unwrap() as usize; + + let field = read( + field_nodes, + field, + &ipc_field.fields[0], + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + Some(last_offset), + version, + scratch, + )?; + MapArray::try_new(data_type, offsets.try_into()?, field, validity) +} + +pub fn skip_map( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for map. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing offsets buffer."))?; + + let data_type = MapArray::get_field(data_type).data_type(); + + skip(field_nodes, data_type, buffers) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/mod.rs b/crates/nano-arrow/src/io/ipc/read/array/mod.rs new file mode 100644 index 000000000000..249e5e05e165 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/mod.rs @@ -0,0 +1,24 @@ +mod primitive; +pub use primitive::*; +mod boolean; +pub use boolean::*; +mod utf8; +pub use utf8::*; +mod binary; +pub use binary::*; +mod fixed_size_binary; +pub use fixed_size_binary::*; +mod list; +pub use list::*; +mod fixed_size_list; +pub use fixed_size_list::*; +mod struct_; +pub use struct_::*; +mod null; +pub use null::*; +mod dictionary; +pub use dictionary::*; +mod union; +pub use union::*; +mod map; +pub use map::*; diff --git a/crates/nano-arrow/src/io/ipc/read/array/null.rs b/crates/nano-arrow/src/io/ipc/read/array/null.rs new file mode 100644 index 000000000000..e56f1886112d --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/null.rs @@ -0,0 +1,28 @@ +use std::collections::VecDeque; + +use super::super::{Node, OutOfSpecKind}; +use crate::array::NullArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +pub fn read_null(field_nodes: &mut VecDeque, data_type: DataType) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + NullArray::try_new(data_type, length) +} + +pub fn skip_null(field_nodes: &mut VecDeque) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for null. The file or stream is corrupted.") + })?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/primitive.rs b/crates/nano-arrow/src/io/ipc/read/array/primitive.rs new file mode 100644 index 000000000000..d6ccb581ffe5 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/primitive.rs @@ -0,0 +1,77 @@ +use std::collections::VecDeque; +use std::convert::TryInto; +use std::io::{Read, Seek}; + +use super::super::read_basic::*; +use super::super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::array::PrimitiveArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::types::NativeType; + +#[allow(clippy::too_many_arguments)] +pub fn read_primitive( + field_nodes: &mut VecDeque, + data_type: DataType, + buffers: &mut VecDeque, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result> +where + Vec: TryInto, +{ + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." 
+ )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let values = read_buffer( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + PrimitiveArray::::try_new(data_type, values, validity) +} + +pub fn skip_primitive( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for primitive. The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing values buffer."))?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/struct_.rs b/crates/nano-arrow/src/io/ipc/read/array/struct_.rs new file mode 100644 index 000000000000..9a5084a8783f --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/struct_.rs @@ -0,0 +1,88 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::super::IpcField; +use super::super::deserialize::{read, skip}; +use super::super::read_basic::*; +use super::super::{Compression, Dictionaries, IpcBuffer, Node, Version}; +use crate::array::StructArray; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_struct( + field_nodes: &mut VecDeque, + data_type: DataType, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: Version, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let fields = StructArray::get_fields(&data_type); + + let values = fields + .iter() + .zip(ipc_field.fields.iter()) + .map(|(field, ipc_field)| { + read( + field_nodes, + field, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + }) + .collect::>>()?; + + StructArray::try_new(data_type, values, validity) +} + +pub fn skip_struct( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for struct. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + + let fields = StructArray::get_fields(data_type); + + fields + .iter() + .try_for_each(|field| skip(field_nodes, field.data_type(), buffers)) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/union.rs b/crates/nano-arrow/src/io/ipc/read/array/union.rs new file mode 100644 index 000000000000..ac1eb9b02527 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/union.rs @@ -0,0 +1,125 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::super::IpcField; +use super::super::deserialize::{read, skip}; +use super::super::read_basic::*; +use super::super::{Compression, Dictionaries, IpcBuffer, Node, OutOfSpecKind, Version}; +use crate::array::UnionArray; +use crate::datatypes::DataType; +use crate::datatypes::UnionMode::Dense; +use crate::error::{Error, Result}; + +#[allow(clippy::too_many_arguments)] +pub fn read_union( + field_nodes: &mut VecDeque, + data_type: DataType, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: Version, + scratch: &mut Vec, +) -> Result { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + if version != Version::V5 { + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + }; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let types = read_buffer( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + + let offsets = if let DataType::Union(_, _, mode) = data_type { + if !mode.is_sparse() { + Some(read_buffer( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?) + } else { + None + } + } else { + unreachable!() + }; + + let fields = UnionArray::get_fields(&data_type); + + let fields = fields + .iter() + .zip(ipc_field.fields.iter()) + .map(|(field, ipc_field)| { + read( + field_nodes, + field, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + None, + version, + scratch, + ) + }) + .collect::>>()?; + + UnionArray::try_new(data_type, types, fields, offsets) +} + +pub fn skip_union( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for struct. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + if let DataType::Union(_, _, Dense) = data_type { + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing offsets buffer."))?; + } else { + unreachable!() + }; + + let fields = UnionArray::get_fields(data_type); + + fields + .iter() + .try_for_each(|field| skip(field_nodes, field.data_type(), buffers)) +} diff --git a/crates/nano-arrow/src/io/ipc/read/array/utf8.rs b/crates/nano-arrow/src/io/ipc/read/array/utf8.rs new file mode 100644 index 000000000000..21e54480e48e --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/array/utf8.rs @@ -0,0 +1,92 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use super::super::read_basic::*; +use super::super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::array::Utf8Array; +use crate::buffer::Buffer; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::offset::Offset; + +#[allow(clippy::too_many_arguments)] +pub fn read_utf8( + field_nodes: &mut VecDeque, + data_type: DataType, + buffers: &mut VecDeque, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result> { + let field_node = field_nodes.pop_front().ok_or_else(|| { + Error::oos(format!( + "IPC: unable to fetch the field for {data_type:?}. The file or stream is corrupted." + )) + })?; + + let validity = read_validity( + buffers, + field_node, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + )?; + + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + let offsets: Buffer = read_buffer( + buffers, + 1 + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + ) + // Older versions of the IPC format sometimes do not report an offset + .or_else(|_| Result::Ok(Buffer::::from(vec![O::default()])))?; + + let last_offset = offsets.last().unwrap().to_usize(); + let values = read_buffer( + buffers, + last_offset, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?; + + Utf8Array::::try_new(data_type, offsets.try_into()?, values, validity) +} + +pub fn skip_utf8( + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result<()> { + let _ = field_nodes.pop_front().ok_or_else(|| { + Error::oos("IPC: unable to fetch the field for utf8. 
The file or stream is corrupted.") + })?; + + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing validity buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing offsets buffer."))?; + let _ = buffers + .pop_front() + .ok_or_else(|| Error::oos("IPC: missing values buffer."))?; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/common.rs b/crates/nano-arrow/src/io/ipc/read/common.rs new file mode 100644 index 000000000000..f890562ed41c --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/common.rs @@ -0,0 +1,363 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use ahash::AHashMap; +use arrow_format; + +use super::deserialize::{read, skip}; +use super::Dictionaries; +use crate::array::*; +use crate::chunk::Chunk; +use crate::datatypes::{DataType, Field}; +use crate::error::{Error, Result}; +use crate::io::ipc::read::OutOfSpecKind; +use crate::io::ipc::{IpcField, IpcSchema}; + +#[derive(Debug, Eq, PartialEq, Hash)] +enum ProjectionResult { + Selected(A), + NotSelected(A), +} + +/// An iterator adapter that will return `Some(x)` or `None` +/// # Panics +/// The iterator panics iff the `projection` is not strictly increasing. +struct ProjectionIter<'a, A, I: Iterator> { + projection: &'a [usize], + iter: I, + current_count: usize, + current_projection: usize, +} + +impl<'a, A, I: Iterator> ProjectionIter<'a, A, I> { + /// # Panics + /// iff `projection` is empty + pub fn new(projection: &'a [usize], iter: I) -> Self { + Self { + projection: &projection[1..], + iter, + current_count: 0, + current_projection: projection[0], + } + } +} + +impl<'a, A, I: Iterator> Iterator for ProjectionIter<'a, A, I> { + type Item = ProjectionResult; + + fn next(&mut self) -> Option { + if let Some(item) = self.iter.next() { + let result = if self.current_count == self.current_projection { + if !self.projection.is_empty() { + assert!(self.projection[0] > self.current_projection); + self.current_projection = self.projection[0]; + self.projection = &self.projection[1..]; + } else { + self.current_projection = 0 // a value that most likely already passed + }; + Some(ProjectionResult::Selected(item)) + } else { + Some(ProjectionResult::NotSelected(item)) + }; + self.current_count += 1; + result + } else { + None + } + } + + fn size_hint(&self) -> (usize, Option) { + self.iter.size_hint() + } +} + +/// Returns a [`Chunk`] from a reader. +/// # Panic +/// Panics iff the projection is not in increasing order (e.g. `[1, 0]` nor `[0, 1, 1]` are valid) +#[allow(clippy::too_many_arguments)] +pub fn read_record_batch( + batch: arrow_format::ipc::RecordBatchRef, + fields: &[Field], + ipc_schema: &IpcSchema, + projection: Option<&[usize]>, + limit: Option, + dictionaries: &Dictionaries, + version: arrow_format::ipc::MetadataVersion, + reader: &mut R, + block_offset: u64, + file_size: u64, + scratch: &mut Vec, +) -> Result>> { + assert_eq!(fields.len(), ipc_schema.fields.len()); + let buffers = batch + .buffers() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferBuffers(err)))? 
+ .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageBuffers))?; + let mut buffers: VecDeque = buffers.iter().collect(); + + // check that the sum of the sizes of all buffers is <= than the size of the file + let buffers_size = buffers + .iter() + .map(|buffer| { + let buffer_size: u64 = buffer + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + Ok(buffer_size) + }) + .sum::>()?; + if buffers_size > file_size { + return Err(Error::from(OutOfSpecKind::InvalidBuffersLength { + buffers_size, + file_size, + })); + } + + let field_nodes = batch + .nodes() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferNodes(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageNodes))?; + let mut field_nodes = field_nodes.iter().collect::>(); + + let columns = if let Some(projection) = projection { + let projection = + ProjectionIter::new(projection, fields.iter().zip(ipc_schema.fields.iter())); + + projection + .map(|maybe_field| match maybe_field { + ProjectionResult::Selected((field, ipc_field)) => Ok(Some(read( + &mut field_nodes, + field, + ipc_field, + &mut buffers, + reader, + dictionaries, + block_offset, + ipc_schema.is_little_endian, + batch.compression().map_err(|err| { + Error::from(OutOfSpecKind::InvalidFlatbufferCompression(err)) + })?, + limit, + version, + scratch, + )?)), + ProjectionResult::NotSelected((field, _)) => { + skip(&mut field_nodes, &field.data_type, &mut buffers)?; + Ok(None) + }, + }) + .filter_map(|x| x.transpose()) + .collect::>>()? + } else { + fields + .iter() + .zip(ipc_schema.fields.iter()) + .map(|(field, ipc_field)| { + read( + &mut field_nodes, + field, + ipc_field, + &mut buffers, + reader, + dictionaries, + block_offset, + ipc_schema.is_little_endian, + batch.compression().map_err(|err| { + Error::from(OutOfSpecKind::InvalidFlatbufferCompression(err)) + })?, + limit, + version, + scratch, + ) + }) + .collect::>>()? + }; + Chunk::try_new(columns) +} + +fn find_first_dict_field_d<'a>( + id: i64, + data_type: &'a DataType, + ipc_field: &'a IpcField, +) -> Option<(&'a Field, &'a IpcField)> { + use DataType::*; + match data_type { + Dictionary(_, inner, _) => find_first_dict_field_d(id, inner.as_ref(), ipc_field), + List(field) | LargeList(field) | FixedSizeList(field, ..) | Map(field, ..) => { + find_first_dict_field(id, field.as_ref(), &ipc_field.fields[0]) + }, + Union(fields, ..) 
| Struct(fields) => { + for (field, ipc_field) in fields.iter().zip(ipc_field.fields.iter()) { + if let Some(f) = find_first_dict_field(id, field, ipc_field) { + return Some(f); + } + } + None + }, + _ => None, + } +} + +fn find_first_dict_field<'a>( + id: i64, + field: &'a Field, + ipc_field: &'a IpcField, +) -> Option<(&'a Field, &'a IpcField)> { + if let Some(field_id) = ipc_field.dictionary_id { + if id == field_id { + return Some((field, ipc_field)); + } + } + find_first_dict_field_d(id, &field.data_type, ipc_field) +} + +pub(crate) fn first_dict_field<'a>( + id: i64, + fields: &'a [Field], + ipc_fields: &'a [IpcField], +) -> Result<(&'a Field, &'a IpcField)> { + assert_eq!(fields.len(), ipc_fields.len()); + for (field, ipc_field) in fields.iter().zip(ipc_fields.iter()) { + if let Some(field) = find_first_dict_field(id, field, ipc_field) { + return Ok(field); + } + } + Err(Error::from(OutOfSpecKind::InvalidId { requested_id: id })) +} + +/// Reads a dictionary from the reader, +/// updating `dictionaries` with the resulting dictionary +#[allow(clippy::too_many_arguments)] +pub fn read_dictionary( + batch: arrow_format::ipc::DictionaryBatchRef, + fields: &[Field], + ipc_schema: &IpcSchema, + dictionaries: &mut Dictionaries, + reader: &mut R, + block_offset: u64, + file_size: u64, + scratch: &mut Vec, +) -> Result<()> { + if batch + .is_delta() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferIsDelta(err)))? + { + return Err(Error::NotYetImplemented( + "delta dictionary batches not supported".to_string(), + )); + } + + let id = batch + .id() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferId(err)))?; + let (first_field, first_ipc_field) = first_dict_field(id, fields, &ipc_schema.fields)?; + + let batch = batch + .data() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferData(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingData))?; + + let value_type = + if let DataType::Dictionary(_, value_type, _) = first_field.data_type.to_logical_type() { + value_type.as_ref() + } else { + return Err(Error::from(OutOfSpecKind::InvalidIdDataType { + requested_id: id, + })); + }; + + // Make a fake schema for the dictionary batch. 
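+    // The dictionary values arrive as a regular record batch with a single column whose
+    // type is the dictionary's value type, so it is read through `read_record_batch` with
+    // a one-field schema and no limit (the dictionary must be materialized in full), and
+    // the resulting array is stored in `dictionaries` under the batch's id.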
+ let fields = vec![Field::new("", value_type.clone(), false)]; + let ipc_schema = IpcSchema { + fields: vec![first_ipc_field.clone()], + is_little_endian: ipc_schema.is_little_endian, + }; + let chunk = read_record_batch( + batch, + &fields, + &ipc_schema, + None, + None, // we must read the whole dictionary + dictionaries, + arrow_format::ipc::MetadataVersion::V5, + reader, + block_offset, + file_size, + scratch, + )?; + + dictionaries.insert(id, chunk.into_arrays().pop().unwrap()); + + Ok(()) +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn project_iter() { + let iter = 1..6; + let iter = ProjectionIter::new(&[0, 2, 4], iter); + let result: Vec<_> = iter.collect(); + use ProjectionResult::*; + assert_eq!( + result, + vec![ + Selected(1), + NotSelected(2), + Selected(3), + NotSelected(4), + Selected(5) + ] + ) + } +} + +pub fn prepare_projection( + fields: &[Field], + mut projection: Vec, +) -> (Vec, AHashMap, Vec) { + let fields = projection.iter().map(|x| fields[*x].clone()).collect(); + + // todo: find way to do this more efficiently + let mut indices = (0..projection.len()).collect::>(); + indices.sort_unstable_by_key(|&i| &projection[i]); + let map = indices.iter().copied().enumerate().fold( + AHashMap::default(), + |mut acc, (index, new_index)| { + acc.insert(index, new_index); + acc + }, + ); + projection.sort_unstable(); + + // check unique + if !projection.is_empty() { + let mut previous = projection[0]; + + for &i in &projection[1..] { + assert!( + previous < i, + "The projection on IPC must not contain duplicates" + ); + previous = i; + } + } + + (projection, map, fields) +} + +pub fn apply_projection( + chunk: Chunk>, + map: &AHashMap, +) -> Chunk> { + // re-order according to projection + let arrays = chunk.into_arrays(); + let mut new_arrays = arrays.clone(); + + map.iter() + .for_each(|(old, new)| new_arrays[*new] = arrays[*old].clone()); + + Chunk::new(new_arrays) +} diff --git a/crates/nano-arrow/src/io/ipc/read/deserialize.rs b/crates/nano-arrow/src/io/ipc/read/deserialize.rs new file mode 100644 index 000000000000..28f8b9e68191 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/deserialize.rs @@ -0,0 +1,251 @@ +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +use arrow_format::ipc::{BodyCompressionRef, MetadataVersion}; + +use super::array::*; +use super::{Dictionaries, IpcBuffer, Node}; +use crate::array::*; +use crate::datatypes::{DataType, Field, PhysicalType}; +use crate::error::Result; +use crate::io::ipc::IpcField; + +#[allow(clippy::too_many_arguments)] +pub fn read( + field_nodes: &mut VecDeque, + field: &Field, + ipc_field: &IpcField, + buffers: &mut VecDeque, + reader: &mut R, + dictionaries: &Dictionaries, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + version: MetadataVersion, + scratch: &mut Vec, +) -> Result> { + use PhysicalType::*; + let data_type = field.data_type.clone(); + + match data_type.to_physical_type() { + Null => read_null(field_nodes, data_type).map(|x| x.boxed()), + Boolean => read_boolean( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + read_primitive::<$T, _>( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()) + }), + Binary => read_binary::( + field_nodes, + data_type, + buffers, + reader, + 
block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + LargeBinary => read_binary::( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + FixedSizeBinary => read_fixed_size_binary( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + Utf8 => read_utf8::( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + LargeUtf8 => read_utf8::( + field_nodes, + data_type, + buffers, + reader, + block_offset, + is_little_endian, + compression, + limit, + scratch, + ) + .map(|x| x.boxed()), + List => read_list::( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + LargeList => read_list::( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + FixedSizeList => read_fixed_size_list( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + Struct => read_struct( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + Dictionary(key_type) => { + match_integer_type!(key_type, |$T| { + read_dictionary::<$T, _>( + field_nodes, + data_type, + ipc_field.dictionary_id, + buffers, + reader, + dictionaries, + block_offset, + compression, + limit, + is_little_endian, + scratch, + ) + .map(|x| x.boxed()) + }) + }, + Union => read_union( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + Map => read_map( + field_nodes, + data_type, + ipc_field, + buffers, + reader, + dictionaries, + block_offset, + is_little_endian, + compression, + limit, + version, + scratch, + ) + .map(|x| x.boxed()), + } +} + +pub fn skip( + field_nodes: &mut VecDeque, + data_type: &DataType, + buffers: &mut VecDeque, +) -> Result<()> { + use PhysicalType::*; + match data_type.to_physical_type() { + Null => skip_null(field_nodes), + Boolean => skip_boolean(field_nodes, buffers), + Primitive(_) => skip_primitive(field_nodes, buffers), + LargeBinary | Binary => skip_binary(field_nodes, buffers), + LargeUtf8 | Utf8 => skip_utf8(field_nodes, buffers), + FixedSizeBinary => skip_fixed_size_binary(field_nodes, buffers), + List => skip_list::(field_nodes, data_type, buffers), + LargeList => skip_list::(field_nodes, data_type, buffers), + FixedSizeList => skip_fixed_size_list(field_nodes, data_type, buffers), + Struct => skip_struct(field_nodes, data_type, buffers), + Dictionary(_) => skip_dictionary(field_nodes, buffers), + Union => skip_union(field_nodes, data_type, buffers), + Map => skip_map(field_nodes, data_type, buffers), + } +} diff --git a/crates/nano-arrow/src/io/ipc/read/error.rs b/crates/nano-arrow/src/io/ipc/read/error.rs new file mode 100644 index 000000000000..cbac69aef2e3 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/error.rs @@ -0,0 +1,112 @@ 
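+//! Error kinds that can arise while reading the IPC format.
+//!
+//! Every [`OutOfSpecKind`] is converted into a generic `Error::OutOfSpec`
+//! through the `From` implementation at the bottom of this module.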
+use crate::error::Error; + +/// The different types of errors that reading from IPC can cause +#[derive(Debug)] +#[non_exhaustive] +pub enum OutOfSpecKind { + /// The IPC file does not start with [b'A', b'R', b'R', b'O', b'W', b'1'] + InvalidHeader, + /// The IPC file does not end with [b'A', b'R', b'R', b'O', b'W', b'1'] + InvalidFooter, + /// The first 4 bytes of the last 10 bytes is < 0 + NegativeFooterLength, + /// The footer is an invalid flatbuffer + InvalidFlatbufferFooter(arrow_format::ipc::planus::Error), + /// The file's footer does not contain record batches + MissingRecordBatches, + /// The footer's record batches is an invalid flatbuffer + InvalidFlatbufferRecordBatches(arrow_format::ipc::planus::Error), + /// The file's footer does not contain a schema + MissingSchema, + /// The footer's schema is an invalid flatbuffer + InvalidFlatbufferSchema(arrow_format::ipc::planus::Error), + /// The file's schema does not contain fields + MissingFields, + /// The footer's dictionaries is an invalid flatbuffer + InvalidFlatbufferDictionaries(arrow_format::ipc::planus::Error), + /// The block is an invalid flatbuffer + InvalidFlatbufferBlock(arrow_format::ipc::planus::Error), + /// The dictionary message is an invalid flatbuffer + InvalidFlatbufferMessage(arrow_format::ipc::planus::Error), + /// The message does not contain a header + MissingMessageHeader, + /// The message's header is an invalid flatbuffer + InvalidFlatbufferHeader(arrow_format::ipc::planus::Error), + /// Relative positions in the file is < 0 + UnexpectedNegativeInteger, + /// dictionaries can only contain dictionary messages; record batches can only contain records + UnexpectedMessageType, + /// RecordBatch messages do not contain buffers + MissingMessageBuffers, + /// The message's buffers is an invalid flatbuffer + InvalidFlatbufferBuffers(arrow_format::ipc::planus::Error), + /// RecordBatch messages does not contain nodes + MissingMessageNodes, + /// The message's nodes is an invalid flatbuffer + InvalidFlatbufferNodes(arrow_format::ipc::planus::Error), + /// The message's body length is an invalid flatbuffer + InvalidFlatbufferBodyLength(arrow_format::ipc::planus::Error), + /// The message does not contain data + MissingData, + /// The message's data is an invalid flatbuffer + InvalidFlatbufferData(arrow_format::ipc::planus::Error), + /// The version is an invalid flatbuffer + InvalidFlatbufferVersion(arrow_format::ipc::planus::Error), + /// The compression is an invalid flatbuffer + InvalidFlatbufferCompression(arrow_format::ipc::planus::Error), + /// The record contains a number of buffers that does not match the required number by the data type + ExpectedBuffer, + /// A buffer's size is smaller than the required for the number of elements + InvalidBuffer { + /// Declared number of elements in the buffer + length: usize, + /// The name of the `NativeType` + type_name: &'static str, + /// Bytes required for the `length` and `type` + required_number_of_bytes: usize, + /// The size of the IPC buffer + buffer_length: usize, + }, + /// A buffer's size is larger than the file size + InvalidBuffersLength { + /// number of bytes of all buffers in the record + buffers_size: u64, + /// the size of the file + file_size: u64, + }, + /// A bitmap's size is smaller than the required for the number of elements + InvalidBitmap { + /// Declared length of the bitmap + length: usize, + /// Number of bits on the IPC buffer + number_of_bits: usize, + }, + /// The dictionary is_delta is an invalid flatbuffer + 
InvalidFlatbufferIsDelta(arrow_format::ipc::planus::Error), + /// The dictionary id is an invalid flatbuffer + InvalidFlatbufferId(arrow_format::ipc::planus::Error), + /// Invalid dictionary id + InvalidId { + /// The requested dictionary id + requested_id: i64, + }, + /// Field id is not a dictionary + InvalidIdDataType { + /// The requested dictionary id + requested_id: i64, + }, + /// FixedSizeBinaryArray has invalid datatype. + InvalidDataType, +} + +impl From for Error { + fn from(kind: OutOfSpecKind) -> Self { + Error::OutOfSpec(format!("{kind:?}")) + } +} + +impl From for Error { + fn from(error: arrow_format::ipc::planus::Error) -> Self { + Error::OutOfSpec(error.to_string()) + } +} diff --git a/crates/nano-arrow/src/io/ipc/read/file.rs b/crates/nano-arrow/src/io/ipc/read/file.rs new file mode 100644 index 000000000000..ec0084a08614 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/file.rs @@ -0,0 +1,321 @@ +use std::convert::TryInto; +use std::io::{Read, Seek, SeekFrom}; + +use ahash::AHashMap; +use arrow_format::ipc::planus::ReadAsRoot; + +use super::super::{ARROW_MAGIC_V1, ARROW_MAGIC_V2, CONTINUATION_MARKER}; +use super::common::*; +use super::schema::fb_to_schema; +use super::{Dictionaries, OutOfSpecKind}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::{Error, Result}; +use crate::io::ipc::IpcSchema; + +/// Metadata of an Arrow IPC file, written in the footer of the file. +#[derive(Debug, Clone)] +pub struct FileMetadata { + /// The schema that is read from the file footer + pub schema: Schema, + + /// The files' [`IpcSchema`] + pub ipc_schema: IpcSchema, + + /// The blocks in the file + /// + /// A block indicates the regions in the file to read to get data + pub blocks: Vec, + + /// Dictionaries associated to each dict_id + pub(crate) dictionaries: Option>, + + /// The total size of the file in bytes + pub size: u64, +} + +fn read_dictionary_message( + reader: &mut R, + offset: u64, + data: &mut Vec, +) -> Result<()> { + let mut message_size: [u8; 4] = [0; 4]; + reader.seek(SeekFrom::Start(offset))?; + reader.read_exact(&mut message_size)?; + if message_size == CONTINUATION_MARKER { + reader.read_exact(&mut message_size)?; + }; + let message_length = i32::from_le_bytes(message_size); + + let message_length: usize = message_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + data.clear(); + data.try_reserve(message_length)?; + reader + .by_ref() + .take(message_length as u64) + .read_to_end(data)?; + + Ok(()) +} + +pub(crate) fn get_dictionary_batch<'a>( + message: &'a arrow_format::ipc::MessageRef, +) -> Result> { + let header = message + .header() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferHeader(err)))? 
+ .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageHeader))?; + match header { + arrow_format::ipc::MessageHeaderRef::DictionaryBatch(batch) => Ok(batch), + _ => Err(Error::from(OutOfSpecKind::UnexpectedMessageType)), + } +} + +fn read_dictionary_block( + reader: &mut R, + metadata: &FileMetadata, + block: &arrow_format::ipc::Block, + dictionaries: &mut Dictionaries, + message_scratch: &mut Vec, + dictionary_scratch: &mut Vec, +) -> Result<()> { + let offset: u64 = block + .offset + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + let length: u64 = block + .meta_data_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + read_dictionary_message(reader, offset, message_scratch)?; + + let message = arrow_format::ipc::MessageRef::read_as_root(message_scratch.as_ref()) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let batch = get_dictionary_batch(&message)?; + + read_dictionary( + batch, + &metadata.schema.fields, + &metadata.ipc_schema, + dictionaries, + reader, + offset + length, + metadata.size, + dictionary_scratch, + ) +} + +/// Reads all file's dictionaries, if any +/// This function is IO-bounded +pub fn read_file_dictionaries( + reader: &mut R, + metadata: &FileMetadata, + scratch: &mut Vec, +) -> Result { + let mut dictionaries = Default::default(); + + let blocks = if let Some(blocks) = &metadata.dictionaries { + blocks + } else { + return Ok(AHashMap::new()); + }; + // use a temporary smaller scratch for the messages + let mut message_scratch = Default::default(); + + for block in blocks { + read_dictionary_block( + reader, + metadata, + block, + &mut dictionaries, + &mut message_scratch, + scratch, + )?; + } + Ok(dictionaries) +} + +/// Reads the footer's length and magic number in footer +fn read_footer_len(reader: &mut R) -> Result<(u64, usize)> { + // read footer length and magic number in footer + let end = reader.seek(SeekFrom::End(-10))? + 10; + + let mut footer: [u8; 10] = [0; 10]; + + reader.read_exact(&mut footer)?; + let footer_len = i32::from_le_bytes(footer[..4].try_into().unwrap()); + + if footer[4..] != ARROW_MAGIC_V2 { + return Err(Error::from(OutOfSpecKind::InvalidFooter)); + } + let footer_len = footer_len + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + Ok((end, footer_len)) +} + +pub(super) fn deserialize_footer(footer_data: &[u8], size: u64) -> Result { + let footer = arrow_format::ipc::FooterRef::read_as_root(footer_data) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferFooter(err)))?; + + let blocks = footer + .record_batches() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferRecordBatches(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingRecordBatches))?; + + let blocks = blocks + .iter() + .map(|block| { + block + .try_into() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferRecordBatches(err))) + }) + .collect::>>()?; + + let ipc_schema = footer + .schema() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferSchema(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingSchema))?; + let (schema, ipc_schema) = fb_to_schema(ipc_schema)?; + + let dictionaries = footer + .dictionaries() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferDictionaries(err)))? 
+ .map(|dictionaries| { + dictionaries + .into_iter() + .map(|block| { + block.try_into().map_err(|err| { + Error::from(OutOfSpecKind::InvalidFlatbufferRecordBatches(err)) + }) + }) + .collect::>>() + }) + .transpose()?; + + Ok(FileMetadata { + schema, + ipc_schema, + blocks, + dictionaries, + size, + }) +} + +/// Read the Arrow IPC file's metadata +pub fn read_file_metadata(reader: &mut R) -> Result { + // check if header contain the correct magic bytes + let mut magic_buffer: [u8; 6] = [0; 6]; + let start = reader.stream_position()?; + reader.read_exact(&mut magic_buffer)?; + if magic_buffer != ARROW_MAGIC_V2 { + if magic_buffer[..4] == ARROW_MAGIC_V1 { + return Err(Error::NotYetImplemented("feather v1 not supported".into())); + } + return Err(Error::from(OutOfSpecKind::InvalidHeader)); + } + + let (end, footer_len) = read_footer_len(reader)?; + + // read footer + reader.seek(SeekFrom::End(-10 - footer_len as i64))?; + + let mut serialized_footer = vec![]; + serialized_footer.try_reserve(footer_len)?; + reader + .by_ref() + .take(footer_len as u64) + .read_to_end(&mut serialized_footer)?; + + deserialize_footer(&serialized_footer, end - start) +} + +pub(crate) fn get_record_batch( + message: arrow_format::ipc::MessageRef, +) -> Result { + let header = message + .header() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferHeader(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageHeader))?; + match header { + arrow_format::ipc::MessageHeaderRef::RecordBatch(batch) => Ok(batch), + _ => Err(Error::from(OutOfSpecKind::UnexpectedMessageType)), + } +} + +/// Reads the record batch at position `index` from the reader. +/// +/// This function is useful for random access to the file. For example, if +/// you have indexed the file somewhere else, this allows pruning +/// certain parts of the file. 
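+///
+/// # Example
+///
+/// A minimal sketch; the file name is hypothetical and errors are unwrapped
+/// for brevity.
+/// ```ignore
+/// use nano_arrow::io::ipc::read::{read_batch, read_file_dictionaries, read_file_metadata};
+///
+/// let mut file = std::fs::File::open("data.arrow").unwrap();
+/// let metadata = read_file_metadata(&mut file).unwrap();
+/// let mut scratch = vec![];
+/// let dictionaries = read_file_dictionaries(&mut file, &metadata, &mut scratch).unwrap();
+///
+/// let (mut message_scratch, mut data_scratch) = (vec![], vec![]);
+/// // read the third record batch, all columns, no row limit
+/// let chunk = read_batch(
+///     &mut file,
+///     &dictionaries,
+///     &metadata,
+///     None,
+///     None,
+///     2,
+///     &mut message_scratch,
+///     &mut data_scratch,
+/// )
+/// .unwrap();
+/// ```
+///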
+/// # Panics +/// This function panics iff `index >= metadata.blocks.len()` +#[allow(clippy::too_many_arguments)] +pub fn read_batch( + reader: &mut R, + dictionaries: &Dictionaries, + metadata: &FileMetadata, + projection: Option<&[usize]>, + limit: Option, + index: usize, + message_scratch: &mut Vec, + data_scratch: &mut Vec, +) -> Result>> { + let block = metadata.blocks[index]; + + let offset: u64 = block + .offset + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let length: u64 = block + .meta_data_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + // read length + reader.seek(SeekFrom::Start(offset))?; + let mut meta_buf = [0; 4]; + reader.read_exact(&mut meta_buf)?; + if meta_buf == CONTINUATION_MARKER { + // continuation marker encountered, read message next + reader.read_exact(&mut meta_buf)?; + } + let meta_len = i32::from_le_bytes(meta_buf) + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + + message_scratch.clear(); + message_scratch.try_reserve(meta_len)?; + reader + .by_ref() + .take(meta_len as u64) + .read_to_end(message_scratch)?; + + let message = arrow_format::ipc::MessageRef::read_as_root(message_scratch.as_ref()) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let batch = get_record_batch(message)?; + + read_record_batch( + batch, + &metadata.schema.fields, + &metadata.ipc_schema, + projection, + limit, + dictionaries, + message + .version() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferVersion(err)))?, + reader, + offset + length, + metadata.size, + data_scratch, + ) +} diff --git a/crates/nano-arrow/src/io/ipc/read/file_async.rs b/crates/nano-arrow/src/io/ipc/read/file_async.rs new file mode 100644 index 000000000000..df1895021282 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/file_async.rs @@ -0,0 +1,349 @@ +//! Async reader for Arrow IPC files +use std::io::SeekFrom; + +use ahash::AHashMap; +use arrow_format::ipc::planus::ReadAsRoot; +use arrow_format::ipc::{Block, MessageHeaderRef}; +use futures::stream::BoxStream; +use futures::{AsyncRead, AsyncReadExt, AsyncSeek, AsyncSeekExt, Stream, StreamExt}; + +use super::common::{apply_projection, prepare_projection, read_dictionary, read_record_batch}; +use super::file::{deserialize_footer, get_record_batch}; +use super::{Dictionaries, FileMetadata, OutOfSpecKind}; +use crate::array::*; +use crate::chunk::Chunk; +use crate::datatypes::{Field, Schema}; +use crate::error::{Error, Result}; +use crate::io::ipc::{IpcSchema, ARROW_MAGIC_V2, CONTINUATION_MARKER}; + +/// Async reader for Arrow IPC files +pub struct FileStream<'a> { + stream: BoxStream<'a, Result>>>, + schema: Option, + metadata: FileMetadata, +} + +impl<'a> FileStream<'a> { + /// Create a new IPC file reader. + /// + /// # Examples + /// See [`FileSink`](crate::io::ipc::write::file_async::FileSink). 
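+    ///
+    /// A minimal sketch, assuming the encoded file is already in memory as
+    /// `buffer: Vec<u8>` (errors are propagated with `?`):
+    /// ```ignore
+    /// use futures::StreamExt;
+    ///
+    /// let mut reader = futures::io::Cursor::new(buffer);
+    /// let metadata = read_file_metadata_async(&mut reader).await?;
+    /// // keep only the first two columns and at most 1000 rows
+    /// let mut stream = FileStream::new(reader, metadata, Some(vec![0, 1]), Some(1000));
+    /// while let Some(chunk) = stream.next().await {
+    ///     println!("read a chunk with {} rows", chunk?.len());
+    /// }
+    /// ```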
+ pub fn new( + reader: R, + metadata: FileMetadata, + projection: Option>, + limit: Option, + ) -> Self + where + R: AsyncRead + AsyncSeek + Unpin + Send + 'a, + { + let (projection, schema) = if let Some(projection) = projection { + let (p, h, fields) = prepare_projection(&metadata.schema.fields, projection); + let schema = Schema { + fields, + metadata: metadata.schema.metadata.clone(), + }; + (Some((p, h)), Some(schema)) + } else { + (None, None) + }; + + let stream = Self::stream(reader, None, metadata.clone(), projection, limit); + Self { + stream, + metadata, + schema, + } + } + + /// Get the metadata from the IPC file. + pub fn metadata(&self) -> &FileMetadata { + &self.metadata + } + + /// Get the projected schema from the IPC file. + pub fn schema(&self) -> &Schema { + self.schema.as_ref().unwrap_or(&self.metadata.schema) + } + + fn stream( + mut reader: R, + mut dictionaries: Option, + metadata: FileMetadata, + projection: Option<(Vec, AHashMap)>, + limit: Option, + ) -> BoxStream<'a, Result>>> + where + R: AsyncRead + AsyncSeek + Unpin + Send + 'a, + { + async_stream::try_stream! { + // read dictionaries + cached_read_dictionaries(&mut reader, &metadata, &mut dictionaries).await?; + + let mut meta_buffer = Default::default(); + let mut block_buffer = Default::default(); + let mut scratch = Default::default(); + let mut remaining = limit.unwrap_or(usize::MAX); + for block in 0..metadata.blocks.len() { + let chunk = read_batch( + &mut reader, + dictionaries.as_mut().unwrap(), + &metadata, + projection.as_ref().map(|x| x.0.as_ref()), + Some(remaining), + block, + &mut meta_buffer, + &mut block_buffer, + &mut scratch + ).await?; + remaining -= chunk.len(); + + let chunk = if let Some((_, map)) = &projection { + // re-order according to projection + apply_projection(chunk, map) + } else { + chunk + }; + + yield chunk; + } + } + .boxed() + } +} + +impl<'a> Stream for FileStream<'a> { + type Item = Result>>; + + fn poll_next( + self: std::pin::Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + self.get_mut().stream.poll_next_unpin(cx) + } +} + +/// Reads the footer's length and magic number in footer +async fn read_footer_len(reader: &mut R) -> Result { + // read footer length and magic number in footer + reader.seek(SeekFrom::End(-10)).await?; + let mut footer: [u8; 10] = [0; 10]; + + reader.read_exact(&mut footer).await?; + let footer_len = i32::from_le_bytes(footer[..4].try_into().unwrap()); + + if footer[4..] != ARROW_MAGIC_V2 { + return Err(Error::from(OutOfSpecKind::InvalidFooter)); + } + footer_len + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength)) +} + +/// Read the metadata from an IPC file. 
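+///
+/// The reader must implement both `AsyncRead` and `AsyncSeek`, since the
+/// footer is located by seeking relative to the end of the file, mirroring
+/// the blocking `read_file_metadata`.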
+pub async fn read_file_metadata_async(reader: &mut R) -> Result +where + R: AsyncRead + AsyncSeek + Unpin, +{ + let footer_size = read_footer_len(reader).await?; + // Read footer + reader.seek(SeekFrom::End(-10 - footer_size as i64)).await?; + + let mut footer = vec![]; + footer.try_reserve(footer_size)?; + reader + .take(footer_size as u64) + .read_to_end(&mut footer) + .await?; + + deserialize_footer(&footer, u64::MAX) +} + +#[allow(clippy::too_many_arguments)] +async fn read_batch( + mut reader: R, + dictionaries: &mut Dictionaries, + metadata: &FileMetadata, + projection: Option<&[usize]>, + limit: Option, + block: usize, + meta_buffer: &mut Vec, + block_buffer: &mut Vec, + scratch: &mut Vec, +) -> Result>> +where + R: AsyncRead + AsyncSeek + Unpin, +{ + let block = metadata.blocks[block]; + + let offset: u64 = block + .offset + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + reader.seek(SeekFrom::Start(offset)).await?; + let mut meta_buf = [0; 4]; + reader.read_exact(&mut meta_buf).await?; + if meta_buf == CONTINUATION_MARKER { + reader.read_exact(&mut meta_buf).await?; + } + + let meta_len = i32::from_le_bytes(meta_buf) + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + + meta_buffer.clear(); + meta_buffer.try_reserve(meta_len)?; + (&mut reader) + .take(meta_len as u64) + .read_to_end(meta_buffer) + .await?; + + let message = arrow_format::ipc::MessageRef::read_as_root(meta_buffer) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let batch = get_record_batch(message)?; + + let block_length: usize = message + .body_length() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferBodyLength(err)))? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + + block_buffer.clear(); + block_buffer.try_reserve(block_length)?; + reader + .take(block_length as u64) + .read_to_end(block_buffer) + .await?; + + let mut cursor = std::io::Cursor::new(&block_buffer); + + read_record_batch( + batch, + &metadata.schema.fields, + &metadata.ipc_schema, + projection, + limit, + dictionaries, + message + .version() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferVersion(err)))?, + &mut cursor, + 0, + metadata.size, + scratch, + ) +} + +async fn read_dictionaries( + mut reader: R, + fields: &[Field], + ipc_schema: &IpcSchema, + blocks: &[Block], + scratch: &mut Vec, +) -> Result +where + R: AsyncRead + AsyncSeek + Unpin, +{ + let mut dictionaries = Default::default(); + let mut data: Vec = vec![]; + let mut buffer: Vec = vec![]; + + for block in blocks { + let offset: u64 = block + .offset + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let length: usize = block + .body_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + read_dictionary_message(&mut reader, offset, &mut data).await?; + + let message = arrow_format::ipc::MessageRef::read_as_root(data.as_ref()) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let header = message + .header() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferHeader(err)))? 
+ .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageHeader))?; + + match header { + MessageHeaderRef::DictionaryBatch(batch) => { + buffer.clear(); + buffer.try_reserve(length)?; + (&mut reader) + .take(length as u64) + .read_to_end(&mut buffer) + .await?; + let mut cursor = std::io::Cursor::new(&buffer); + read_dictionary( + batch, + fields, + ipc_schema, + &mut dictionaries, + &mut cursor, + 0, + u64::MAX, + scratch, + )?; + }, + _ => return Err(Error::from(OutOfSpecKind::UnexpectedMessageType)), + } + } + Ok(dictionaries) +} + +async fn read_dictionary_message(mut reader: R, offset: u64, data: &mut Vec) -> Result<()> +where + R: AsyncRead + AsyncSeek + Unpin, +{ + let mut message_size = [0; 4]; + reader.seek(SeekFrom::Start(offset)).await?; + reader.read_exact(&mut message_size).await?; + if message_size == CONTINUATION_MARKER { + reader.read_exact(&mut message_size).await?; + } + let footer_size = i32::from_le_bytes(message_size); + + let footer_size: usize = footer_size + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + data.clear(); + data.try_reserve(footer_size)?; + (&mut reader) + .take(footer_size as u64) + .read_to_end(data) + .await?; + + Ok(()) +} + +async fn cached_read_dictionaries( + reader: &mut R, + metadata: &FileMetadata, + dictionaries: &mut Option, +) -> Result<()> { + match (&dictionaries, metadata.dictionaries.as_deref()) { + (None, Some(blocks)) => { + let new_dictionaries = read_dictionaries( + reader, + &metadata.schema.fields, + &metadata.ipc_schema, + blocks, + &mut Default::default(), + ) + .await?; + *dictionaries = Some(new_dictionaries); + }, + (None, None) => { + *dictionaries = Some(Default::default()); + }, + _ => {}, + }; + Ok(()) +} diff --git a/crates/nano-arrow/src/io/ipc/read/mod.rs b/crates/nano-arrow/src/io/ipc/read/mod.rs new file mode 100644 index 000000000000..887cf7b36258 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/mod.rs @@ -0,0 +1,45 @@ +//! APIs to read Arrow's IPC format. +//! +//! The two important structs here are the [`FileReader`](reader::FileReader), +//! which provides arbitrary access to any of its messages, and the +//! [`StreamReader`](stream::StreamReader), which only supports reading +//! data in the order it was written in. 
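+//!
+//! A minimal sketch of the blocking path (the file name is hypothetical and
+//! errors are unwrapped for brevity):
+//! ```ignore
+//! use nano_arrow::io::ipc::read::{read_file_metadata, FileReader};
+//!
+//! let mut file = std::fs::File::open("data.arrow").unwrap();
+//! let metadata = read_file_metadata(&mut file).unwrap();
+//! let reader = FileReader::new(file, metadata, None, None);
+//! for chunk in reader {
+//!     // each item is a `Chunk` of `Box<dyn Array>` columns
+//!     let chunk = chunk.unwrap();
+//!     println!("{} rows", chunk.len());
+//! }
+//! ```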
+use ahash::AHashMap; + +use crate::array::Array; + +mod array; +mod common; +mod deserialize; +mod error; +pub(crate) mod file; +mod read_basic; +mod reader; +mod schema; +mod stream; + +pub use error::OutOfSpecKind; + +#[cfg(feature = "io_ipc_read_async")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_read_async")))] +pub mod stream_async; + +#[cfg(feature = "io_ipc_read_async")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_read_async")))] +pub mod file_async; + +pub(crate) use common::first_dict_field; +#[cfg(feature = "io_flight")] +pub(crate) use common::{read_dictionary, read_record_batch}; +pub use file::{read_batch, read_file_dictionaries, read_file_metadata, FileMetadata}; +pub use reader::FileReader; +pub use schema::deserialize_schema; +pub use stream::{read_stream_metadata, StreamMetadata, StreamReader, StreamState}; + +/// how dictionaries are tracked in this crate +pub type Dictionaries = AHashMap>; + +pub(crate) type Node<'a> = arrow_format::ipc::FieldNodeRef<'a>; +pub(crate) type IpcBuffer<'a> = arrow_format::ipc::BufferRef<'a>; +pub(crate) type Compression<'a> = arrow_format::ipc::BodyCompressionRef<'a>; +pub(crate) type Version = arrow_format::ipc::MetadataVersion; diff --git a/crates/nano-arrow/src/io/ipc/read/read_basic.rs b/crates/nano-arrow/src/io/ipc/read/read_basic.rs new file mode 100644 index 000000000000..a56ebc81b3c4 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/read_basic.rs @@ -0,0 +1,291 @@ +use std::collections::VecDeque; +use std::convert::TryInto; +use std::io::{Read, Seek, SeekFrom}; + +use super::super::compression; +use super::super::endianness::is_native_little_endian; +use super::{Compression, IpcBuffer, Node, OutOfSpecKind}; +use crate::bitmap::Bitmap; +use crate::buffer::Buffer; +use crate::error::{Error, Result}; +use crate::types::NativeType; + +fn read_swapped( + reader: &mut R, + length: usize, + buffer: &mut Vec, + is_little_endian: bool, +) -> Result<()> { + // slow case where we must reverse bits + let mut slice = vec![0u8; length * std::mem::size_of::()]; + reader.read_exact(&mut slice)?; + + let chunks = slice.chunks_exact(std::mem::size_of::()); + if !is_little_endian { + // machine is little endian, file is big endian + buffer + .as_mut_slice() + .iter_mut() + .zip(chunks) + .try_for_each(|(slot, chunk)| { + let a: T::Bytes = match chunk.try_into() { + Ok(a) => a, + Err(_) => unreachable!(), + }; + *slot = T::from_be_bytes(a); + Result::Ok(()) + })?; + } else { + // machine is big endian, file is little endian + return Err(Error::NotYetImplemented( + "Reading little endian files from big endian machines".to_string(), + )); + } + Ok(()) +} + +fn read_uncompressed_buffer( + reader: &mut R, + buffer_length: usize, + length: usize, + is_little_endian: bool, +) -> Result> { + let required_number_of_bytes = length.saturating_mul(std::mem::size_of::()); + if required_number_of_bytes > buffer_length { + return Err(Error::from(OutOfSpecKind::InvalidBuffer { + length, + type_name: std::any::type_name::(), + required_number_of_bytes, + buffer_length, + })); + // todo: move this to the error's Display + /* + return Err(Error::OutOfSpec( + format!("The slots of the array times the physical size must \ + be smaller or equal to the length of the IPC buffer. 
\ + However, this array reports {} slots, which, for physical type \"{}\", corresponds to {} bytes, \ + which is larger than the buffer length {}", + length, + std::any::type_name::(), + bytes, + buffer_length, + ), + )); + */ + } + + // it is undefined behavior to call read_exact on un-initialized, https://doc.rust-lang.org/std/io/trait.Read.html#tymethod.read + // see also https://github.com/MaikKlein/ash/issues/354#issue-781730580 + let mut buffer = vec![T::default(); length]; + + if is_native_little_endian() == is_little_endian { + // fast case where we can just copy the contents + let slice = bytemuck::cast_slice_mut(&mut buffer); + reader.read_exact(slice)?; + } else { + read_swapped(reader, length, &mut buffer, is_little_endian)?; + } + Ok(buffer) +} + +fn read_compressed_buffer( + reader: &mut R, + buffer_length: usize, + length: usize, + is_little_endian: bool, + compression: Compression, + scratch: &mut Vec, +) -> Result> { + if is_little_endian != is_native_little_endian() { + return Err(Error::NotYetImplemented( + "Reading compressed and big endian IPC".to_string(), + )); + } + + // it is undefined behavior to call read_exact on un-initialized, https://doc.rust-lang.org/std/io/trait.Read.html#tymethod.read + // see also https://github.com/MaikKlein/ash/issues/354#issue-781730580 + let mut buffer = vec![T::default(); length]; + + // decompress first + scratch.clear(); + scratch.try_reserve(buffer_length)?; + reader + .by_ref() + .take(buffer_length as u64) + .read_to_end(scratch)?; + + let out_slice = bytemuck::cast_slice_mut(&mut buffer); + + let compression = compression + .codec() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferCompression(err)))?; + + match compression { + arrow_format::ipc::CompressionType::Lz4Frame => { + compression::decompress_lz4(&scratch[8..], out_slice)?; + }, + arrow_format::ipc::CompressionType::Zstd => { + compression::decompress_zstd(&scratch[8..], out_slice)?; + }, + } + Ok(buffer) +} + +pub fn read_buffer( + buf: &mut VecDeque, + length: usize, // in slots + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + scratch: &mut Vec, +) -> Result> { + let buf = buf + .pop_front() + .ok_or_else(|| Error::from(OutOfSpecKind::ExpectedBuffer))?; + + let offset: u64 = buf + .offset() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let buffer_length: usize = buf + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + reader.seek(SeekFrom::Start(block_offset + offset))?; + + if let Some(compression) = compression { + Ok(read_compressed_buffer( + reader, + buffer_length, + length, + is_little_endian, + compression, + scratch, + )? 
+ .into()) + } else { + Ok(read_uncompressed_buffer(reader, buffer_length, length, is_little_endian)?.into()) + } +} + +fn read_uncompressed_bitmap( + length: usize, + bytes: usize, + reader: &mut R, +) -> Result> { + if length > bytes * 8 { + return Err(Error::from(OutOfSpecKind::InvalidBitmap { + length, + number_of_bits: bytes * 8, + })); + } + + let mut buffer = vec![]; + buffer.try_reserve(bytes)?; + reader + .by_ref() + .take(bytes as u64) + .read_to_end(&mut buffer)?; + + Ok(buffer) +} + +fn read_compressed_bitmap( + length: usize, + bytes: usize, + compression: Compression, + reader: &mut R, + scratch: &mut Vec, +) -> Result> { + let mut buffer = vec![0; (length + 7) / 8]; + + scratch.clear(); + scratch.try_reserve(bytes)?; + reader.by_ref().take(bytes as u64).read_to_end(scratch)?; + + let compression = compression + .codec() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferCompression(err)))?; + + match compression { + arrow_format::ipc::CompressionType::Lz4Frame => { + compression::decompress_lz4(&scratch[8..], &mut buffer)?; + }, + arrow_format::ipc::CompressionType::Zstd => { + compression::decompress_zstd(&scratch[8..], &mut buffer)?; + }, + } + Ok(buffer) +} + +pub fn read_bitmap( + buf: &mut VecDeque, + length: usize, + reader: &mut R, + block_offset: u64, + _: bool, + compression: Option, + scratch: &mut Vec, +) -> Result { + let buf = buf + .pop_front() + .ok_or_else(|| Error::from(OutOfSpecKind::ExpectedBuffer))?; + + let offset: u64 = buf + .offset() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let bytes: usize = buf + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + reader.seek(SeekFrom::Start(block_offset + offset))?; + + let buffer = if let Some(compression) = compression { + read_compressed_bitmap(length, bytes, compression, reader, scratch) + } else { + read_uncompressed_bitmap(length, bytes, reader) + }?; + + Bitmap::try_new(buffer, length) +} + +#[allow(clippy::too_many_arguments)] +pub fn read_validity( + buffers: &mut VecDeque, + field_node: Node, + reader: &mut R, + block_offset: u64, + is_little_endian: bool, + compression: Option, + limit: Option, + scratch: &mut Vec, +) -> Result> { + let length: usize = field_node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let length = limit.map(|limit| limit.min(length)).unwrap_or(length); + + Ok(if field_node.null_count() > 0 { + Some(read_bitmap( + buffers, + length, + reader, + block_offset, + is_little_endian, + compression, + scratch, + )?) + } else { + let _ = buffers + .pop_front() + .ok_or_else(|| Error::from(OutOfSpecKind::ExpectedBuffer))?; + None + }) +} diff --git a/crates/nano-arrow/src/io/ipc/read/reader.rs b/crates/nano-arrow/src/io/ipc/read/reader.rs new file mode 100644 index 000000000000..80c900fd9a76 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/reader.rs @@ -0,0 +1,137 @@ +use std::io::{Read, Seek}; + +use ahash::AHashMap; + +use super::common::*; +use super::{read_batch, read_file_dictionaries, Dictionaries, FileMetadata}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::Result; + +/// An iterator of [`Chunk`]s from an Arrow IPC file. 
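+///
+/// Columns can be pruned by passing a projection to [`FileReader::new`]; the
+/// indices must be in increasing order and free of duplicates (see the panics
+/// note on `new`). A short sketch, assuming `file` and `metadata` were
+/// obtained as in the module docs:
+/// ```ignore
+/// // keep only columns 0 and 2, and stop after 10_000 rows
+/// let reader = FileReader::new(file, metadata, Some(vec![0, 2]), Some(10_000));
+/// ```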
+pub struct FileReader { + reader: R, + metadata: FileMetadata, + // the dictionaries are going to be read + dictionaries: Option, + current_block: usize, + projection: Option<(Vec, AHashMap, Schema)>, + remaining: usize, + data_scratch: Vec, + message_scratch: Vec, +} + +impl FileReader { + /// Creates a new [`FileReader`]. Use `projection` to only take certain columns. + /// # Panic + /// Panics iff the projection is not in increasing order (e.g. `[1, 0]` nor `[0, 1, 1]` are valid) + pub fn new( + reader: R, + metadata: FileMetadata, + projection: Option>, + limit: Option, + ) -> Self { + let projection = projection.map(|projection| { + let (p, h, fields) = prepare_projection(&metadata.schema.fields, projection); + let schema = Schema { + fields, + metadata: metadata.schema.metadata.clone(), + }; + (p, h, schema) + }); + Self { + reader, + metadata, + dictionaries: Default::default(), + projection, + remaining: limit.unwrap_or(usize::MAX), + current_block: 0, + data_scratch: Default::default(), + message_scratch: Default::default(), + } + } + + /// Return the schema of the file + pub fn schema(&self) -> &Schema { + self.projection + .as_ref() + .map(|x| &x.2) + .unwrap_or(&self.metadata.schema) + } + + /// Returns the [`FileMetadata`] + pub fn metadata(&self) -> &FileMetadata { + &self.metadata + } + + /// Consumes this FileReader, returning the underlying reader + pub fn into_inner(self) -> R { + self.reader + } + + /// Get the inner memory scratches so they can be reused in a new writer. + /// This can be utilized to save memory allocations for performance reasons. + pub fn get_scratches(&mut self) -> (Vec, Vec) { + ( + std::mem::take(&mut self.data_scratch), + std::mem::take(&mut self.message_scratch), + ) + } + + /// Set the inner memory scratches so they can be reused in a new writer. + /// This can be utilized to save memory allocations for performance reasons. 
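+    ///
+    /// For example (sketch), when reading many files back to back the scratch
+    /// buffers of a finished reader can be moved into the next one:
+    /// ```ignore
+    /// let scratches = finished_reader.get_scratches();
+    /// next_reader.set_scratches(scratches);
+    /// ```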
+ pub fn set_scratches(&mut self, scratches: (Vec, Vec)) { + (self.data_scratch, self.message_scratch) = scratches; + } + + fn read_dictionaries(&mut self) -> Result<()> { + if self.dictionaries.is_none() { + self.dictionaries = Some(read_file_dictionaries( + &mut self.reader, + &self.metadata, + &mut self.data_scratch, + )?); + }; + Ok(()) + } +} + +impl Iterator for FileReader { + type Item = Result>>; + + fn next(&mut self) -> Option { + // get current block + if self.current_block == self.metadata.blocks.len() { + return None; + } + + match self.read_dictionaries() { + Ok(_) => {}, + Err(e) => return Some(Err(e)), + }; + + let block = self.current_block; + self.current_block += 1; + + let chunk = read_batch( + &mut self.reader, + self.dictionaries.as_ref().unwrap(), + &self.metadata, + self.projection.as_ref().map(|x| x.0.as_ref()), + Some(self.remaining), + block, + &mut self.message_scratch, + &mut self.data_scratch, + ); + self.remaining -= chunk.as_ref().map(|x| x.len()).unwrap_or_default(); + + let chunk = if let Some((_, map, _)) = &self.projection { + // re-order according to projection + chunk.map(|chunk| apply_projection(chunk, map)) + } else { + chunk + }; + Some(chunk) + } +} diff --git a/crates/nano-arrow/src/io/ipc/read/schema.rs b/crates/nano-arrow/src/io/ipc/read/schema.rs new file mode 100644 index 000000000000..1b6687f30c95 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/schema.rs @@ -0,0 +1,429 @@ +use arrow_format::ipc::planus::ReadAsRoot; +use arrow_format::ipc::{FieldRef, FixedSizeListRef, MapRef, TimeRef, TimestampRef, UnionRef}; + +use super::super::{IpcField, IpcSchema}; +use super::{OutOfSpecKind, StreamMetadata}; +use crate::datatypes::{ + get_extension, DataType, Extension, Field, IntegerType, IntervalUnit, Metadata, Schema, + TimeUnit, UnionMode, +}; +use crate::error::{Error, Result}; + +fn try_unzip_vec>>(iter: I) -> Result<(Vec, Vec)> { + let mut a = vec![]; + let mut b = vec![]; + for maybe_item in iter { + let (a_i, b_i) = maybe_item?; + a.push(a_i); + b.push(b_i); + } + + Ok((a, b)) +} + +fn deserialize_field(ipc_field: arrow_format::ipc::FieldRef) -> Result<(Field, IpcField)> { + let metadata = read_metadata(&ipc_field)?; + + let extension = get_extension(&metadata); + + let (data_type, ipc_field_) = get_data_type(ipc_field, extension, true)?; + + let field = Field { + name: ipc_field + .name()? + .ok_or_else(|| Error::oos("Every field in IPC must have a name"))? + .to_string(), + data_type, + is_nullable: ipc_field.nullable()?, + metadata, + }; + + Ok((field, ipc_field_)) +} + +fn read_metadata(field: &arrow_format::ipc::FieldRef) -> Result { + Ok(if let Some(list) = field.custom_metadata()? { + let mut metadata_map = Metadata::new(); + for kv in list { + let kv = kv?; + if let (Some(k), Some(v)) = (kv.key()?, kv.value()?) { + metadata_map.insert(k.to_string(), v.to_string()); + } + } + metadata_map + } else { + Metadata::default() + }) +} + +fn deserialize_integer(int: arrow_format::ipc::IntRef) -> Result { + Ok(match (int.bit_width()?, int.is_signed()?) 
{ + (8, true) => IntegerType::Int8, + (8, false) => IntegerType::UInt8, + (16, true) => IntegerType::Int16, + (16, false) => IntegerType::UInt16, + (32, true) => IntegerType::Int32, + (32, false) => IntegerType::UInt32, + (64, true) => IntegerType::Int64, + (64, false) => IntegerType::UInt64, + _ => return Err(Error::oos("IPC: indexType can only be 8, 16, 32 or 64.")), + }) +} + +fn deserialize_timeunit(time_unit: arrow_format::ipc::TimeUnit) -> Result { + use arrow_format::ipc::TimeUnit::*; + Ok(match time_unit { + Second => TimeUnit::Second, + Millisecond => TimeUnit::Millisecond, + Microsecond => TimeUnit::Microsecond, + Nanosecond => TimeUnit::Nanosecond, + }) +} + +fn deserialize_time(time: TimeRef) -> Result<(DataType, IpcField)> { + let unit = deserialize_timeunit(time.unit()?)?; + + let data_type = match (time.bit_width()?, unit) { + (32, TimeUnit::Second) => DataType::Time32(TimeUnit::Second), + (32, TimeUnit::Millisecond) => DataType::Time32(TimeUnit::Millisecond), + (64, TimeUnit::Microsecond) => DataType::Time64(TimeUnit::Microsecond), + (64, TimeUnit::Nanosecond) => DataType::Time64(TimeUnit::Nanosecond), + (bits, precision) => { + return Err(Error::nyi(format!( + "Time type with bit width of {bits} and unit of {precision:?}" + ))) + }, + }; + Ok((data_type, IpcField::default())) +} + +fn deserialize_timestamp(timestamp: TimestampRef) -> Result<(DataType, IpcField)> { + let timezone = timestamp.timezone()?.map(|tz| tz.to_string()); + let time_unit = deserialize_timeunit(timestamp.unit()?)?; + Ok(( + DataType::Timestamp(time_unit, timezone), + IpcField::default(), + )) +} + +fn deserialize_union(union_: UnionRef, field: FieldRef) -> Result<(DataType, IpcField)> { + let mode = UnionMode::sparse(union_.mode()? == arrow_format::ipc::UnionMode::Sparse); + let ids = union_.type_ids()?.map(|x| x.iter().collect()); + + let fields = field + .children()? + .ok_or_else(|| Error::oos("IPC: Union must contain children"))?; + if fields.is_empty() { + return Err(Error::oos("IPC: Union must contain at least one child")); + } + + let (fields, ipc_fields) = try_unzip_vec(fields.iter().map(|field| { + let (field, fields) = deserialize_field(field?)?; + Ok((field, fields)) + }))?; + let ipc_field = IpcField { + fields: ipc_fields, + dictionary_id: None, + }; + Ok((DataType::Union(fields, ids, mode), ipc_field)) +} + +fn deserialize_map(map: MapRef, field: FieldRef) -> Result<(DataType, IpcField)> { + let is_sorted = map.keys_sorted()?; + + let children = field + .children()? + .ok_or_else(|| Error::oos("IPC: Map must contain children"))?; + let inner = children + .get(0) + .ok_or_else(|| Error::oos("IPC: Map must contain one child"))??; + let (field, ipc_field) = deserialize_field(inner)?; + + let data_type = DataType::Map(Box::new(field), is_sorted); + Ok(( + data_type, + IpcField { + fields: vec![ipc_field], + dictionary_id: None, + }, + )) +} + +fn deserialize_struct(field: FieldRef) -> Result<(DataType, IpcField)> { + let fields = field + .children()? 
+ .ok_or_else(|| Error::oos("IPC: Struct must contain children"))?; + if fields.is_empty() { + return Err(Error::oos("IPC: Struct must contain at least one child")); + } + let (fields, ipc_fields) = try_unzip_vec(fields.iter().map(|field| { + let (field, fields) = deserialize_field(field?)?; + Ok((field, fields)) + }))?; + let ipc_field = IpcField { + fields: ipc_fields, + dictionary_id: None, + }; + Ok((DataType::Struct(fields), ipc_field)) +} + +fn deserialize_list(field: FieldRef) -> Result<(DataType, IpcField)> { + let children = field + .children()? + .ok_or_else(|| Error::oos("IPC: List must contain children"))?; + let inner = children + .get(0) + .ok_or_else(|| Error::oos("IPC: List must contain one child"))??; + let (field, ipc_field) = deserialize_field(inner)?; + + Ok(( + DataType::List(Box::new(field)), + IpcField { + fields: vec![ipc_field], + dictionary_id: None, + }, + )) +} + +fn deserialize_large_list(field: FieldRef) -> Result<(DataType, IpcField)> { + let children = field + .children()? + .ok_or_else(|| Error::oos("IPC: List must contain children"))?; + let inner = children + .get(0) + .ok_or_else(|| Error::oos("IPC: List must contain one child"))??; + let (field, ipc_field) = deserialize_field(inner)?; + + Ok(( + DataType::LargeList(Box::new(field)), + IpcField { + fields: vec![ipc_field], + dictionary_id: None, + }, + )) +} + +fn deserialize_fixed_size_list( + list: FixedSizeListRef, + field: FieldRef, +) -> Result<(DataType, IpcField)> { + let children = field + .children()? + .ok_or_else(|| Error::oos("IPC: FixedSizeList must contain children"))?; + let inner = children + .get(0) + .ok_or_else(|| Error::oos("IPC: FixedSizeList must contain one child"))??; + let (field, ipc_field) = deserialize_field(inner)?; + + let size = list + .list_size()? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + Ok(( + DataType::FixedSizeList(Box::new(field), size), + IpcField { + fields: vec![ipc_field], + dictionary_id: None, + }, + )) +} + +/// Get the Arrow data type from the flatbuffer Field table +fn get_data_type( + field: arrow_format::ipc::FieldRef, + extension: Extension, + may_be_dictionary: bool, +) -> Result<(DataType, IpcField)> { + if let Some(dictionary) = field.dictionary()? { + if may_be_dictionary { + let int = dictionary + .index_type()? + .ok_or_else(|| Error::oos("indexType is mandatory in Dictionary."))?; + let index_type = deserialize_integer(int)?; + let (inner, mut ipc_field) = get_data_type(field, extension, false)?; + ipc_field.dictionary_id = Some(dictionary.id()?); + return Ok(( + DataType::Dictionary(index_type, Box::new(inner), dictionary.is_ordered()?), + ipc_field, + )); + } + } + + if let Some(extension) = extension { + let (name, metadata) = extension; + let (data_type, fields) = get_data_type(field, None, false)?; + return Ok(( + DataType::Extension(name, Box::new(data_type), metadata), + fields, + )); + } + + let type_ = field + .type_()? 
+ .ok_or_else(|| Error::oos("IPC: field type is mandatory"))?; + + use arrow_format::ipc::TypeRef::*; + Ok(match type_ { + Null(_) => (DataType::Null, IpcField::default()), + Bool(_) => (DataType::Boolean, IpcField::default()), + Int(int) => { + let data_type = deserialize_integer(int)?.into(); + (data_type, IpcField::default()) + }, + Binary(_) => (DataType::Binary, IpcField::default()), + LargeBinary(_) => (DataType::LargeBinary, IpcField::default()), + Utf8(_) => (DataType::Utf8, IpcField::default()), + LargeUtf8(_) => (DataType::LargeUtf8, IpcField::default()), + FixedSizeBinary(fixed) => ( + DataType::FixedSizeBinary( + fixed + .byte_width()? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?, + ), + IpcField::default(), + ), + FloatingPoint(float) => { + let data_type = match float.precision()? { + arrow_format::ipc::Precision::Half => DataType::Float16, + arrow_format::ipc::Precision::Single => DataType::Float32, + arrow_format::ipc::Precision::Double => DataType::Float64, + }; + (data_type, IpcField::default()) + }, + Date(date) => { + let data_type = match date.unit()? { + arrow_format::ipc::DateUnit::Day => DataType::Date32, + arrow_format::ipc::DateUnit::Millisecond => DataType::Date64, + }; + (data_type, IpcField::default()) + }, + Time(time) => deserialize_time(time)?, + Timestamp(timestamp) => deserialize_timestamp(timestamp)?, + Interval(interval) => { + let data_type = match interval.unit()? { + arrow_format::ipc::IntervalUnit::YearMonth => { + DataType::Interval(IntervalUnit::YearMonth) + }, + arrow_format::ipc::IntervalUnit::DayTime => { + DataType::Interval(IntervalUnit::DayTime) + }, + arrow_format::ipc::IntervalUnit::MonthDayNano => { + DataType::Interval(IntervalUnit::MonthDayNano) + }, + }; + (data_type, IpcField::default()) + }, + Duration(duration) => { + let time_unit = deserialize_timeunit(duration.unit()?)?; + (DataType::Duration(time_unit), IpcField::default()) + }, + Decimal(decimal) => { + let bit_width: usize = decimal + .bit_width()? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let precision: usize = decimal + .precision()? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + let scale: usize = decimal + .scale()? + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_type = match bit_width { + 128 => DataType::Decimal(precision, scale), + 256 => DataType::Decimal256(precision, scale), + _ => return Err(Error::from(OutOfSpecKind::NegativeFooterLength)), + }; + + (data_type, IpcField::default()) + }, + List(_) => deserialize_list(field)?, + LargeList(_) => deserialize_large_list(field)?, + FixedSizeList(list) => deserialize_fixed_size_list(list, field)?, + Struct(_) => deserialize_struct(field)?, + Union(union_) => deserialize_union(union_, field)?, + Map(map) => deserialize_map(map, field)?, + }) +} + +/// Deserialize an flatbuffers-encoded Schema message into [`Schema`] and [`IpcSchema`]. +pub fn deserialize_schema(message: &[u8]) -> Result<(Schema, IpcSchema)> { + let message = arrow_format::ipc::MessageRef::read_as_root(message) + .map_err(|err| Error::oos(format!("Unable deserialize message: {err:?}")))?; + + let schema = match message + .header()? + .ok_or_else(|| Error::oos("Unable to convert header to a schema".to_string()))? 
+ { + arrow_format::ipc::MessageHeaderRef::Schema(schema) => Ok(schema), + _ => Err(Error::nyi("The message is expected to be a Schema message")), + }?; + + fb_to_schema(schema) +} + +/// Deserialize the raw Schema table from IPC format to Schema data type +pub(super) fn fb_to_schema(schema: arrow_format::ipc::SchemaRef) -> Result<(Schema, IpcSchema)> { + let fields = schema + .fields()? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingFields))?; + let (fields, ipc_fields) = try_unzip_vec(fields.iter().map(|field| { + let (field, fields) = deserialize_field(field?)?; + Ok((field, fields)) + }))?; + + let is_little_endian = match schema.endianness()? { + arrow_format::ipc::Endianness::Little => true, + arrow_format::ipc::Endianness::Big => false, + }; + + let mut metadata = Metadata::default(); + if let Some(md_fields) = schema.custom_metadata()? { + for kv in md_fields { + let kv = kv?; + let k_str = kv.key()?; + let v_str = kv.value()?; + if let Some(k) = k_str { + if let Some(v) = v_str { + metadata.insert(k.to_string(), v.to_string()); + } + } + } + } + + Ok(( + Schema { fields, metadata }, + IpcSchema { + fields: ipc_fields, + is_little_endian, + }, + )) +} + +pub(super) fn deserialize_stream_metadata(meta: &[u8]) -> Result { + let message = arrow_format::ipc::MessageRef::read_as_root(meta) + .map_err(|err| Error::OutOfSpec(format!("Unable to get root as message: {err:?}")))?; + let version = message.version()?; + // message header is a Schema, so read it + let header = message + .header()? + .ok_or_else(|| Error::oos("Unable to read the first IPC message"))?; + let schema = if let arrow_format::ipc::MessageHeaderRef::Schema(schema) = header { + schema + } else { + return Err(Error::oos( + "The first IPC message of the stream must be a schema", + )); + }; + let (schema, ipc_schema) = fb_to_schema(schema)?; + + Ok(StreamMetadata { + schema, + version, + ipc_schema, + }) +} diff --git a/crates/nano-arrow/src/io/ipc/read/stream.rs b/crates/nano-arrow/src/io/ipc/read/stream.rs new file mode 100644 index 000000000000..848bf5acb938 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/stream.rs @@ -0,0 +1,318 @@ +use std::io::Read; + +use ahash::AHashMap; +use arrow_format; +use arrow_format::ipc::planus::ReadAsRoot; + +use super::super::CONTINUATION_MARKER; +use super::common::*; +use super::schema::deserialize_stream_metadata; +use super::{Dictionaries, OutOfSpecKind}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::{Error, Result}; +use crate::io::ipc::IpcSchema; + +/// Metadata of an Arrow IPC stream, written at the start of the stream +#[derive(Debug, Clone)] +pub struct StreamMetadata { + /// The schema that is read from the stream's first message + pub schema: Schema, + + /// The IPC version of the stream + pub version: arrow_format::ipc::MetadataVersion, + + /// The IPC fields tracking dictionaries + pub ipc_schema: IpcSchema, +} + +/// Reads the metadata of the stream +pub fn read_stream_metadata(reader: &mut R) -> Result { + // determine metadata length + let mut meta_size: [u8; 4] = [0; 4]; + reader.read_exact(&mut meta_size)?; + let meta_length = { + // If a continuation marker is encountered, skip over it and read + // the size from the next four bytes. 
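+        // (An encapsulated IPC message begins with the optional 4-byte
+        // continuation marker 0xFFFFFFFF followed by a 4-byte little-endian
+        // metadata length; writers that predate the marker omit it, which is
+        // why it is treated as optional here.)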
+ if meta_size == CONTINUATION_MARKER { + reader.read_exact(&mut meta_size)?; + } + i32::from_le_bytes(meta_size) + }; + + let length: usize = meta_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let mut buffer = vec![]; + buffer.try_reserve(length)?; + reader + .by_ref() + .take(length as u64) + .read_to_end(&mut buffer)?; + + deserialize_stream_metadata(&buffer) +} + +/// Encodes the stream's status after each read. +/// +/// A stream is an iterator, and an iterator returns `Option`. The `Item` +/// type in the [`StreamReader`] case is `StreamState`, which means that an Arrow +/// stream may yield one of three values: (1) `None`, which signals that the stream +/// is done; (2) [`StreamState::Some`], which signals that there was +/// data waiting in the stream and we read it; and finally (3) +/// [`Some(StreamState::Waiting)`], which means that the stream is still "live", it +/// just doesn't hold any data right now. +pub enum StreamState { + /// A live stream without data + Waiting, + /// Next item in the stream + Some(Chunk>), +} + +impl StreamState { + /// Return the data inside this wrapper. + /// + /// # Panics + /// + /// If the `StreamState` was `Waiting`. + pub fn unwrap(self) -> Chunk> { + if let StreamState::Some(batch) = self { + batch + } else { + panic!("The batch is not available") + } + } +} + +/// Reads the next item, yielding `None` if the stream is done, +/// and a [`StreamState`] otherwise. +fn read_next( + reader: &mut R, + metadata: &StreamMetadata, + dictionaries: &mut Dictionaries, + message_buffer: &mut Vec, + data_buffer: &mut Vec, + projection: &Option<(Vec, AHashMap, Schema)>, + scratch: &mut Vec, +) -> Result> { + // determine metadata length + let mut meta_length: [u8; 4] = [0; 4]; + + match reader.read_exact(&mut meta_length) { + Ok(()) => (), + Err(e) => { + return if e.kind() == std::io::ErrorKind::UnexpectedEof { + // Handle EOF without the "0xFFFFFFFF 0x00000000" + // valid according to: + // https://arrow.apache.org/docs/format/Columnar.html#ipc-streaming-format + Ok(Some(StreamState::Waiting)) + } else { + Err(Error::from(e)) + }; + }, + } + + let meta_length = { + // If a continuation marker is encountered, skip over it and read + // the size from the next four bytes. + if meta_length == CONTINUATION_MARKER { + reader.read_exact(&mut meta_length)?; + } + i32::from_le_bytes(meta_length) + }; + + let meta_length: usize = meta_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + if meta_length == 0 { + // the stream has ended, mark the reader as finished + return Ok(None); + } + + message_buffer.clear(); + message_buffer.try_reserve(meta_length)?; + reader + .by_ref() + .take(meta_length as u64) + .read_to_end(message_buffer)?; + + let message = arrow_format::ipc::MessageRef::read_as_root(message_buffer.as_ref()) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let header = message + .header() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferHeader(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageHeader))?; + + let block_length: usize = message + .body_length() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferBodyLength(err)))? 
+ .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + + match header { + arrow_format::ipc::MessageHeaderRef::RecordBatch(batch) => { + data_buffer.clear(); + data_buffer.try_reserve(block_length)?; + reader + .by_ref() + .take(block_length as u64) + .read_to_end(data_buffer)?; + + let file_size = data_buffer.len() as u64; + + let mut reader = std::io::Cursor::new(data_buffer); + + let chunk = read_record_batch( + batch, + &metadata.schema.fields, + &metadata.ipc_schema, + projection.as_ref().map(|x| x.0.as_ref()), + None, + dictionaries, + metadata.version, + &mut reader, + 0, + file_size, + scratch, + ); + + if let Some((_, map, _)) = projection { + // re-order according to projection + chunk + .map(|chunk| apply_projection(chunk, map)) + .map(|x| Some(StreamState::Some(x))) + } else { + chunk.map(|x| Some(StreamState::Some(x))) + } + }, + arrow_format::ipc::MessageHeaderRef::DictionaryBatch(batch) => { + data_buffer.clear(); + data_buffer.try_reserve(block_length)?; + reader + .by_ref() + .take(block_length as u64) + .read_to_end(data_buffer)?; + + let file_size = data_buffer.len() as u64; + let mut dict_reader = std::io::Cursor::new(&data_buffer); + + read_dictionary( + batch, + &metadata.schema.fields, + &metadata.ipc_schema, + dictionaries, + &mut dict_reader, + 0, + file_size, + scratch, + )?; + + // read the next message until we encounter a RecordBatch message + read_next( + reader, + metadata, + dictionaries, + message_buffer, + data_buffer, + projection, + scratch, + ) + }, + _ => Err(Error::from(OutOfSpecKind::UnexpectedMessageType)), + } +} + +/// Arrow Stream reader. +/// +/// An [`Iterator`] over an Arrow stream that yields a result of [`StreamState`]s. +/// This is the recommended way to read an arrow stream (by iterating over its data). +/// +/// For a more thorough walkthrough consult [this example](https://github.com/jorgecarleitao/arrow2/tree/main/examples/ipc_pyarrow). +pub struct StreamReader { + reader: R, + metadata: StreamMetadata, + dictionaries: Dictionaries, + finished: bool, + data_buffer: Vec, + message_buffer: Vec, + projection: Option<(Vec, AHashMap, Schema)>, + scratch: Vec, +} + +impl StreamReader { + /// Try to create a new stream reader + /// + /// The first message in the stream is the schema, the reader will fail if it does not + /// encounter a schema. 
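+    ///
+    /// A minimal sketch (the TCP address is hypothetical, errors unwrapped):
+    /// ```ignore
+    /// let mut stream = std::net::TcpStream::connect("127.0.0.1:9001").unwrap();
+    /// let metadata = read_stream_metadata(&mut stream).unwrap();
+    /// let reader = StreamReader::new(stream, metadata, None);
+    /// for state in reader {
+    ///     match state.unwrap() {
+    ///         StreamState::Some(chunk) => println!("{} rows", chunk.len()),
+    ///         StreamState::Waiting => std::thread::sleep(std::time::Duration::from_millis(100)),
+    ///     }
+    /// }
+    /// ```
+    ///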
+ /// To check if the reader is done, use `is_finished(self)` + pub fn new(reader: R, metadata: StreamMetadata, projection: Option>) -> Self { + let projection = projection.map(|projection| { + let (p, h, fields) = prepare_projection(&metadata.schema.fields, projection); + let schema = Schema { + fields, + metadata: metadata.schema.metadata.clone(), + }; + (p, h, schema) + }); + + Self { + reader, + metadata, + dictionaries: Default::default(), + finished: false, + data_buffer: Default::default(), + message_buffer: Default::default(), + projection, + scratch: Default::default(), + } + } + + /// Return the schema of the stream + pub fn metadata(&self) -> &StreamMetadata { + &self.metadata + } + + /// Return the schema of the file + pub fn schema(&self) -> &Schema { + self.projection + .as_ref() + .map(|x| &x.2) + .unwrap_or(&self.metadata.schema) + } + + /// Check if the stream is finished + pub fn is_finished(&self) -> bool { + self.finished + } + + fn maybe_next(&mut self) -> Result> { + if self.finished { + return Ok(None); + } + let batch = read_next( + &mut self.reader, + &self.metadata, + &mut self.dictionaries, + &mut self.message_buffer, + &mut self.data_buffer, + &self.projection, + &mut self.scratch, + )?; + if batch.is_none() { + self.finished = true; + } + Ok(batch) + } +} + +impl Iterator for StreamReader { + type Item = Result; + + fn next(&mut self) -> Option { + self.maybe_next().transpose() + } +} diff --git a/crates/nano-arrow/src/io/ipc/read/stream_async.rs b/crates/nano-arrow/src/io/ipc/read/stream_async.rs new file mode 100644 index 000000000000..f87f84a8d317 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/read/stream_async.rs @@ -0,0 +1,237 @@ +//! APIs to read Arrow streams asynchronously + +use arrow_format::ipc::planus::ReadAsRoot; +use futures::future::BoxFuture; +use futures::{AsyncRead, AsyncReadExt, FutureExt, Stream}; + +use super::super::CONTINUATION_MARKER; +use super::common::{read_dictionary, read_record_batch}; +use super::schema::deserialize_stream_metadata; +use super::{Dictionaries, OutOfSpecKind, StreamMetadata}; +use crate::array::*; +use crate::chunk::Chunk; +use crate::error::{Error, Result}; + +/// A (private) state of stream messages +struct ReadState { + pub reader: R, + pub metadata: StreamMetadata, + pub dictionaries: Dictionaries, + /// The internal buffer to read data inside the messages (records and dictionaries) to + pub data_buffer: Vec, + /// The internal buffer to read messages to + pub message_buffer: Vec, +} + +/// The state of an Arrow stream +enum StreamState { + /// The stream does not contain new chunks (and it has not been closed) + Waiting(ReadState), + /// The stream contain a new chunk + Some((ReadState, Chunk>)), +} + +/// Reads the [`StreamMetadata`] of the Arrow stream asynchronously +pub async fn read_stream_metadata_async( + reader: &mut R, +) -> Result { + // determine metadata length + let mut meta_size: [u8; 4] = [0; 4]; + reader.read_exact(&mut meta_size).await?; + let meta_len = { + // If a continuation marker is encountered, skip over it and read + // the size from the next four bytes. 
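+        // The continuation marker is the 0xFFFFFFFF sentinel that precedes the metadata
+        // length in the encapsulated IPC message format.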
+ if meta_size == CONTINUATION_MARKER { + reader.read_exact(&mut meta_size).await?; + } + i32::from_le_bytes(meta_size) + }; + + let meta_len: usize = meta_len + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let mut meta_buffer = vec![]; + meta_buffer.try_reserve(meta_len)?; + reader + .take(meta_len as u64) + .read_to_end(&mut meta_buffer) + .await?; + + deserialize_stream_metadata(&meta_buffer) +} + +/// Reads the next item, yielding `None` if the stream has been closed, +/// or a [`StreamState`] otherwise. +async fn maybe_next( + mut state: ReadState, +) -> Result>> { + let mut scratch = Default::default(); + // determine metadata length + let mut meta_length: [u8; 4] = [0; 4]; + + match state.reader.read_exact(&mut meta_length).await { + Ok(()) => (), + Err(e) => { + return if e.kind() == std::io::ErrorKind::UnexpectedEof { + // Handle EOF without the "0xFFFFFFFF 0x00000000" + // valid according to: + // https://arrow.apache.org/docs/format/Columnar.html#ipc-streaming-format + Ok(Some(StreamState::Waiting(state))) + } else { + Err(Error::from(e)) + }; + }, + } + + let meta_length = { + // If a continuation marker is encountered, skip over it and read + // the size from the next four bytes. + if meta_length == CONTINUATION_MARKER { + state.reader.read_exact(&mut meta_length).await?; + } + i32::from_le_bytes(meta_length) + }; + + let meta_length: usize = meta_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + if meta_length == 0 { + // the stream has ended, mark the reader as finished + return Ok(None); + } + + state.message_buffer.clear(); + state.message_buffer.try_reserve(meta_length)?; + (&mut state.reader) + .take(meta_length as u64) + .read_to_end(&mut state.message_buffer) + .await?; + + let message = arrow_format::ipc::MessageRef::read_as_root(state.message_buffer.as_ref()) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + let header = message + .header() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferHeader(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageHeader))?; + + let block_length: usize = message + .body_length() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferBodyLength(err)))? 
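+        // `body_length` counts the buffer bytes that follow the flatbuffer header.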
+ .try_into() + .map_err(|_| Error::from(OutOfSpecKind::UnexpectedNegativeInteger))?; + + match header { + arrow_format::ipc::MessageHeaderRef::RecordBatch(batch) => { + state.data_buffer.clear(); + state.data_buffer.try_reserve(block_length)?; + (&mut state.reader) + .take(block_length as u64) + .read_to_end(&mut state.data_buffer) + .await?; + + read_record_batch( + batch, + &state.metadata.schema.fields, + &state.metadata.ipc_schema, + None, + None, + &state.dictionaries, + state.metadata.version, + &mut std::io::Cursor::new(&state.data_buffer), + 0, + state.data_buffer.len() as u64, + &mut scratch, + ) + .map(|chunk| Some(StreamState::Some((state, chunk)))) + }, + arrow_format::ipc::MessageHeaderRef::DictionaryBatch(batch) => { + state.data_buffer.clear(); + state.data_buffer.try_reserve(block_length)?; + (&mut state.reader) + .take(block_length as u64) + .read_to_end(&mut state.data_buffer) + .await?; + + let file_size = state.data_buffer.len() as u64; + + let mut dict_reader = std::io::Cursor::new(&state.data_buffer); + + read_dictionary( + batch, + &state.metadata.schema.fields, + &state.metadata.ipc_schema, + &mut state.dictionaries, + &mut dict_reader, + 0, + file_size, + &mut scratch, + )?; + + // read the next message until we encounter a Chunk> message + Ok(Some(StreamState::Waiting(state))) + }, + _ => Err(Error::from(OutOfSpecKind::UnexpectedMessageType)), + } +} + +/// A [`Stream`] over an Arrow IPC stream that asynchronously yields [`Chunk`]s. +pub struct AsyncStreamReader<'a, R: AsyncRead + Unpin + Send + 'a> { + metadata: StreamMetadata, + future: Option>>>>, +} + +impl<'a, R: AsyncRead + Unpin + Send + 'a> AsyncStreamReader<'a, R> { + /// Creates a new [`AsyncStreamReader`] + pub fn new(reader: R, metadata: StreamMetadata) -> Self { + let state = ReadState { + reader, + metadata: metadata.clone(), + dictionaries: Default::default(), + data_buffer: Default::default(), + message_buffer: Default::default(), + }; + let future = Some(maybe_next(state).boxed()); + Self { metadata, future } + } + + /// Return the schema of the stream + pub fn metadata(&self) -> &StreamMetadata { + &self.metadata + } +} + +impl<'a, R: AsyncRead + Unpin + Send> Stream for AsyncStreamReader<'a, R> { + type Item = Result>>; + + fn poll_next( + self: std::pin::Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + use std::pin::Pin; + use std::task::Poll; + let me = Pin::into_inner(self); + + match &mut me.future { + Some(fut) => match fut.as_mut().poll(cx) { + Poll::Ready(Ok(None)) => { + me.future = None; + Poll::Ready(None) + }, + Poll::Ready(Ok(Some(StreamState::Some((state, batch))))) => { + me.future = Some(Box::pin(maybe_next(state))); + Poll::Ready(Some(Ok(batch))) + }, + Poll::Ready(Ok(Some(StreamState::Waiting(_)))) => Poll::Pending, + Poll::Ready(Err(err)) => { + me.future = None; + Poll::Ready(Some(Err(err))) + }, + Poll::Pending => Poll::Pending, + }, + None => Poll::Ready(None), + } + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/common.rs b/crates/nano-arrow/src/io/ipc/write/common.rs new file mode 100644 index 000000000000..4684bd7f658d --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/common.rs @@ -0,0 +1,448 @@ +use std::borrow::{Borrow, Cow}; + +use arrow_format::ipc::planus::Builder; + +use super::super::IpcField; +use super::{write, write_dictionary}; +use crate::array::*; +use crate::chunk::Chunk; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::io::ipc::endianness::is_native_little_endian; +use 
crate::io::ipc::read::Dictionaries; + +/// Compression codec +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +pub enum Compression { + /// LZ4 (framed) + LZ4, + /// ZSTD + ZSTD, +} + +/// Options declaring the behaviour of writing to IPC +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash, Default)] +pub struct WriteOptions { + /// Whether the buffers should be compressed and which codec to use. + /// Note: to use compression the crate must be compiled with feature `io_ipc_compression`. + pub compression: Option, +} + +fn encode_dictionary( + field: &IpcField, + array: &dyn Array, + options: &WriteOptions, + dictionary_tracker: &mut DictionaryTracker, + encoded_dictionaries: &mut Vec, +) -> Result<()> { + use PhysicalType::*; + match array.data_type().to_physical_type() { + Utf8 | LargeUtf8 | Binary | LargeBinary | Primitive(_) | Boolean | Null + | FixedSizeBinary => Ok(()), + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + let dict_id = field.dictionary_id + .ok_or_else(|| Error::InvalidArgumentError("Dictionaries must have an associated id".to_string()))?; + + let emit = dictionary_tracker.insert(dict_id, array)?; + + let array = array.as_any().downcast_ref::>().unwrap(); + let values = array.values(); + encode_dictionary(field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries + )?; + + if emit { + encoded_dictionaries.push(dictionary_batch_to_bytes::<$T>( + dict_id, + array, + options, + is_native_little_endian(), + )); + }; + Ok(()) + }), + Struct => { + let array = array.as_any().downcast_ref::().unwrap(); + let fields = field.fields.as_slice(); + if array.fields().len() != fields.len() { + return Err(Error::InvalidArgumentError( + "The number of fields in a struct must equal the number of children in IpcField".to_string(), + )); + } + fields + .iter() + .zip(array.values().iter()) + .try_for_each(|(field, values)| { + encode_dictionary( + field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries, + ) + }) + }, + List => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap() + .values(); + let field = &field.fields[0]; // todo: error instead + encode_dictionary( + field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries, + ) + }, + LargeList => { + let values = array + .as_any() + .downcast_ref::>() + .unwrap() + .values(); + let field = &field.fields[0]; // todo: error instead + encode_dictionary( + field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries, + ) + }, + FixedSizeList => { + let values = array + .as_any() + .downcast_ref::() + .unwrap() + .values(); + let field = &field.fields[0]; // todo: error instead + encode_dictionary( + field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries, + ) + }, + Union => { + let values = array + .as_any() + .downcast_ref::() + .unwrap() + .fields(); + let fields = &field.fields[..]; // todo: error instead + if values.len() != fields.len() { + return Err(Error::InvalidArgumentError( + "The number of fields in a union must equal the number of children in IpcField" + .to_string(), + )); + } + fields + .iter() + .zip(values.iter()) + .try_for_each(|(field, values)| { + encode_dictionary( + field, + values.as_ref(), + options, + dictionary_tracker, + encoded_dictionaries, + ) + }) + }, + Map => { + let values = array.as_any().downcast_ref::().unwrap().field(); + let field = &field.fields[0]; // todo: error instead + encode_dictionary( + field, + values.as_ref(), + options, + 
dictionary_tracker, + encoded_dictionaries, + ) + }, + } +} + +pub fn encode_chunk( + chunk: &Chunk>, + fields: &[IpcField], + dictionary_tracker: &mut DictionaryTracker, + options: &WriteOptions, +) -> Result<(Vec, EncodedData)> { + let mut encoded_message = EncodedData::default(); + let encoded_dictionaries = encode_chunk_amortized( + chunk, + fields, + dictionary_tracker, + options, + &mut encoded_message, + )?; + Ok((encoded_dictionaries, encoded_message)) +} + +// Amortizes `EncodedData` allocation. +pub fn encode_chunk_amortized( + chunk: &Chunk>, + fields: &[IpcField], + dictionary_tracker: &mut DictionaryTracker, + options: &WriteOptions, + encoded_message: &mut EncodedData, +) -> Result> { + let mut encoded_dictionaries = vec![]; + + for (field, array) in fields.iter().zip(chunk.as_ref()) { + encode_dictionary( + field, + array.as_ref(), + options, + dictionary_tracker, + &mut encoded_dictionaries, + )?; + } + + chunk_to_bytes_amortized(chunk, options, encoded_message); + + Ok(encoded_dictionaries) +} + +fn serialize_compression( + compression: Option, +) -> Option> { + if let Some(compression) = compression { + let codec = match compression { + Compression::LZ4 => arrow_format::ipc::CompressionType::Lz4Frame, + Compression::ZSTD => arrow_format::ipc::CompressionType::Zstd, + }; + Some(Box::new(arrow_format::ipc::BodyCompression { + codec, + method: arrow_format::ipc::BodyCompressionMethod::Buffer, + })) + } else { + None + } +} + +/// Write [`Chunk`] into two sets of bytes, one for the header (ipc::Schema::Message) and the +/// other for the batch's data +fn chunk_to_bytes_amortized( + chunk: &Chunk>, + options: &WriteOptions, + encoded_message: &mut EncodedData, +) { + let mut nodes: Vec = vec![]; + let mut buffers: Vec = vec![]; + let mut arrow_data = std::mem::take(&mut encoded_message.arrow_data); + arrow_data.clear(); + + let mut offset = 0; + for array in chunk.arrays() { + write( + array.as_ref(), + &mut buffers, + &mut arrow_data, + &mut nodes, + &mut offset, + is_native_little_endian(), + options.compression, + ) + } + + let compression = serialize_compression(options.compression); + + let message = arrow_format::ipc::Message { + version: arrow_format::ipc::MetadataVersion::V5, + header: Some(arrow_format::ipc::MessageHeader::RecordBatch(Box::new( + arrow_format::ipc::RecordBatch { + length: chunk.len() as i64, + nodes: Some(nodes), + buffers: Some(buffers), + compression, + }, + ))), + body_length: arrow_data.len() as i64, + custom_metadata: None, + }; + + let mut builder = Builder::new(); + let ipc_message = builder.finish(&message, None); + encoded_message.ipc_message = ipc_message.to_vec(); + encoded_message.arrow_data = arrow_data +} + +/// Write dictionary values into two sets of bytes, one for the header (ipc::Schema::Message) and the +/// other for the data +fn dictionary_batch_to_bytes( + dict_id: i64, + array: &DictionaryArray, + options: &WriteOptions, + is_little_endian: bool, +) -> EncodedData { + let mut nodes: Vec = vec![]; + let mut buffers: Vec = vec![]; + let mut arrow_data: Vec = vec![]; + + let length = write_dictionary( + array, + &mut buffers, + &mut arrow_data, + &mut nodes, + &mut 0, + is_little_endian, + options.compression, + false, + ); + + let compression = serialize_compression(options.compression); + + let message = arrow_format::ipc::Message { + version: arrow_format::ipc::MetadataVersion::V5, + header: Some(arrow_format::ipc::MessageHeader::DictionaryBatch(Box::new( + arrow_format::ipc::DictionaryBatch { + id: dict_id, + data: 
Some(Box::new(arrow_format::ipc::RecordBatch { + length: length as i64, + nodes: Some(nodes), + buffers: Some(buffers), + compression, + })), + is_delta: false, + }, + ))), + body_length: arrow_data.len() as i64, + custom_metadata: None, + }; + + let mut builder = Builder::new(); + let ipc_message = builder.finish(&message, None); + + EncodedData { + ipc_message: ipc_message.to_vec(), + arrow_data, + } +} + +/// Keeps track of dictionaries that have been written, to avoid emitting the same dictionary +/// multiple times. Can optionally error if an update to an existing dictionary is attempted, which +/// isn't allowed in the `FileWriter`. +pub struct DictionaryTracker { + pub dictionaries: Dictionaries, + pub cannot_replace: bool, +} + +impl DictionaryTracker { + /// Keep track of the dictionary with the given ID and values. Behavior: + /// + /// * If this ID has been written already and has the same data, return `Ok(false)` to indicate + /// that the dictionary was not actually inserted (because it's already been seen). + /// * If this ID has been written already but with different data, and this tracker is + /// configured to return an error, return an error. + /// * If the tracker has not been configured to error on replacement or this dictionary + /// has never been seen before, return `Ok(true)` to indicate that the dictionary was just + /// inserted. + pub fn insert(&mut self, dict_id: i64, array: &dyn Array) -> Result { + let values = match array.data_type() { + DataType::Dictionary(key_type, _, _) => { + match_integer_type!(key_type, |$T| { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + array.values() + }) + }, + _ => unreachable!(), + }; + + // If a dictionary with this id was already emitted, check if it was the same. + if let Some(last) = self.dictionaries.get(&dict_id) { + if last.as_ref() == values.as_ref() { + // Same dictionary values => no need to emit it again + return Ok(false); + } else if self.cannot_replace { + return Err(Error::InvalidArgumentError( + "Dictionary replacement detected when writing IPC file format. \ + Arrow IPC files only support a single dictionary for a given field \ + across all batches." + .to_string(), + )); + } + }; + + self.dictionaries.insert(dict_id, values.clone()); + Ok(true) + } +} + +/// Stores the encoded data, which is an ipc::Schema::Message, and optional Arrow data +#[derive(Debug, Default)] +pub struct EncodedData { + /// An encoded ipc::Schema::Message + pub ipc_message: Vec, + /// Arrow buffers to be written, should be an empty vec for schema messages + pub arrow_data: Vec, +} + +/// Calculate an 8-byte boundary and return the number of bytes needed to pad to 8 bytes +#[inline] +pub(crate) fn pad_to_64(len: usize) -> usize { + ((len + 63) & !63) - len +} + +/// An array [`Chunk`] with optional accompanying IPC fields. +#[derive(Debug, Clone, PartialEq)] +pub struct Record<'a> { + columns: Cow<'a, Chunk>>, + fields: Option>, +} + +impl<'a> Record<'a> { + /// Get the IPC fields for this record. + pub fn fields(&self) -> Option<&[IpcField]> { + self.fields.as_deref() + } + + /// Get the Arrow columns in this record. 
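+    /// (Columns are stored in a [`Cow`], so a record may either own or borrow its chunk.)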
+ pub fn columns(&self) -> &Chunk> { + self.columns.borrow() + } +} + +impl From>> for Record<'static> { + fn from(columns: Chunk>) -> Self { + Self { + columns: Cow::Owned(columns), + fields: None, + } + } +} + +impl<'a, F> From<(Chunk>, Option)> for Record<'a> +where + F: Into>, +{ + fn from((columns, fields): (Chunk>, Option)) -> Self { + Self { + columns: Cow::Owned(columns), + fields: fields.map(|f| f.into()), + } + } +} + +impl<'a, F> From<(&'a Chunk>, Option)> for Record<'a> +where + F: Into>, +{ + fn from((columns, fields): (&'a Chunk>, Option)) -> Self { + Self { + columns: Cow::Borrowed(columns), + fields: fields.map(|f| f.into()), + } + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/common_async.rs b/crates/nano-arrow/src/io/ipc/write/common_async.rs new file mode 100644 index 000000000000..397391cd24ee --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/common_async.rs @@ -0,0 +1,66 @@ +use futures::{AsyncWrite, AsyncWriteExt}; + +use super::super::CONTINUATION_MARKER; +use super::common::{pad_to_64, EncodedData}; +use crate::error::Result; + +/// Write a message's IPC data and buffers, returning metadata and buffer data lengths written +pub async fn write_message( + mut writer: W, + encoded: EncodedData, +) -> Result<(usize, usize)> { + let arrow_data_len = encoded.arrow_data.len(); + + let a = 64 - 1; + let buffer = encoded.ipc_message; + let flatbuf_size = buffer.len(); + let prefix_size = 8; // the message length + let aligned_size = (flatbuf_size + prefix_size + a) & !a; + let padding_bytes = aligned_size - flatbuf_size - prefix_size; + + write_continuation(&mut writer, (aligned_size - prefix_size) as i32).await?; + + // write the flatbuf + if flatbuf_size > 0 { + writer.write_all(&buffer).await?; + } + // write padding + writer.write_all(&vec![0; padding_bytes]).await?; + + // write arrow data + let body_len = if arrow_data_len > 0 { + write_body_buffers(writer, &encoded.arrow_data).await? 
+ } else { + 0 + }; + + Ok((aligned_size, body_len)) +} + +/// Write a record batch to the writer, writing the message size before the message +/// if the record batch is being written to a stream +pub async fn write_continuation( + mut writer: W, + total_len: i32, +) -> Result { + writer.write_all(&CONTINUATION_MARKER).await?; + writer.write_all(&total_len.to_le_bytes()[..]).await?; + Ok(8) +} + +async fn write_body_buffers( + mut writer: W, + data: &[u8], +) -> Result { + let len = data.len(); + let pad_len = pad_to_64(data.len()); + let total_len = len + pad_len; + + // write body buffer + writer.write_all(data).await?; + if pad_len > 0 { + writer.write_all(&vec![0u8; pad_len][..]).await?; + } + + Ok(total_len) +} diff --git a/crates/nano-arrow/src/io/ipc/write/common_sync.rs b/crates/nano-arrow/src/io/ipc/write/common_sync.rs new file mode 100644 index 000000000000..b20196419b2c --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/common_sync.rs @@ -0,0 +1,59 @@ +use std::io::Write; + +use super::super::CONTINUATION_MARKER; +use super::common::{pad_to_64, EncodedData}; +use crate::error::Result; + +/// Write a message's IPC data and buffers, returning metadata and buffer data lengths written +pub fn write_message(writer: &mut W, encoded: &EncodedData) -> Result<(usize, usize)> { + let arrow_data_len = encoded.arrow_data.len(); + + let a = 8 - 1; + let buffer = &encoded.ipc_message; + let flatbuf_size = buffer.len(); + let prefix_size = 8; + let aligned_size = (flatbuf_size + prefix_size + a) & !a; + let padding_bytes = aligned_size - flatbuf_size - prefix_size; + + write_continuation(writer, (aligned_size - prefix_size) as i32)?; + + // write the flatbuf + if flatbuf_size > 0 { + writer.write_all(buffer)?; + } + // write padding + // aligned to a 8 byte boundary, so maximum is [u8;8] + const PADDING_MAX: [u8; 8] = [0u8; 8]; + writer.write_all(&PADDING_MAX[..padding_bytes])?; + + // write arrow data + let body_len = if arrow_data_len > 0 { + write_body_buffers(writer, &encoded.arrow_data)? + } else { + 0 + }; + + Ok((aligned_size, body_len)) +} + +fn write_body_buffers(mut writer: W, data: &[u8]) -> Result { + let len = data.len(); + let pad_len = pad_to_64(data.len()); + let total_len = len + pad_len; + + // write body buffer + writer.write_all(data)?; + if pad_len > 0 { + writer.write_all(&vec![0u8; pad_len][..])?; + } + + Ok(total_len) +} + +/// Write a record batch to the writer, writing the message size before the message +/// if the record batch is being written to a stream +pub fn write_continuation(writer: &mut W, total_len: i32) -> Result { + writer.write_all(&CONTINUATION_MARKER)?; + writer.write_all(&total_len.to_le_bytes()[..])?; + Ok(8) +} diff --git a/crates/nano-arrow/src/io/ipc/write/file_async.rs b/crates/nano-arrow/src/io/ipc/write/file_async.rs new file mode 100644 index 000000000000..93a1715282e2 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/file_async.rs @@ -0,0 +1,252 @@ +//! Async writer for IPC files. 
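+//!
+//! [`FileSink`] implements [`futures::Sink`] for [`Record`]s: feed chunks into it and
+//! close it to write the Arrow file footer.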
+ +use std::task::Poll; + +use arrow_format::ipc::planus::Builder; +use arrow_format::ipc::{Block, Footer, MetadataVersion}; +use futures::future::BoxFuture; +use futures::{AsyncWrite, AsyncWriteExt, FutureExt, Sink}; + +use super::common::{encode_chunk, DictionaryTracker, EncodedData, WriteOptions}; +use super::common_async::{write_continuation, write_message}; +use super::schema::serialize_schema; +use super::{default_ipc_fields, schema_to_bytes, Record}; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::io::ipc::{IpcField, ARROW_MAGIC_V2}; + +type WriteOutput = (usize, Option, Vec, Option); + +/// Sink that writes array [`chunks`](crate::chunk::Chunk) as an IPC file. +/// +/// The file header is automatically written before writing the first chunk, and the file footer is +/// automatically written when the sink is closed. +/// +/// # Examples +/// +/// ``` +/// use futures::{SinkExt, TryStreamExt, io::Cursor}; +/// use arrow2::array::{Array, Int32Array}; +/// use arrow2::datatypes::{DataType, Field, Schema}; +/// use arrow2::chunk::Chunk; +/// use arrow2::io::ipc::write::file_async::FileSink; +/// use arrow2::io::ipc::read::file_async::{read_file_metadata_async, FileStream}; +/// # futures::executor::block_on(async move { +/// let schema = Schema::from(vec![ +/// Field::new("values", DataType::Int32, true), +/// ]); +/// +/// let mut buffer = Cursor::new(vec![]); +/// let mut sink = FileSink::new( +/// &mut buffer, +/// schema, +/// None, +/// Default::default(), +/// ); +/// +/// // Write chunks to file +/// for i in 0..3 { +/// let values = Int32Array::from(&[Some(i), None]); +/// let chunk = Chunk::new(vec![values.boxed()]); +/// sink.feed(chunk.into()).await?; +/// } +/// sink.close().await?; +/// drop(sink); +/// +/// // Read chunks from file +/// buffer.set_position(0); +/// let metadata = read_file_metadata_async(&mut buffer).await?; +/// let mut stream = FileStream::new(buffer, metadata, None, None); +/// let chunks = stream.try_collect::>().await?; +/// # arrow2::error::Result::Ok(()) +/// # }).unwrap(); +/// ``` +pub struct FileSink<'a, W: AsyncWrite + Unpin + Send + 'a> { + writer: Option, + task: Option>>>, + options: WriteOptions, + dictionary_tracker: DictionaryTracker, + offset: usize, + fields: Vec, + record_blocks: Vec, + dictionary_blocks: Vec, + schema: Schema, +} + +impl<'a, W> FileSink<'a, W> +where + W: AsyncWrite + Unpin + Send + 'a, +{ + /// Create a new file writer. 
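+    ///
+    /// The file header (magic bytes and schema message) is encoded here and written
+    /// when the sink is first polled.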
+ pub fn new( + writer: W, + schema: Schema, + ipc_fields: Option>, + options: WriteOptions, + ) -> Self { + let fields = ipc_fields.unwrap_or_else(|| default_ipc_fields(&schema.fields)); + let encoded = EncodedData { + ipc_message: schema_to_bytes(&schema, &fields), + arrow_data: vec![], + }; + let task = Some(Self::start(writer, encoded).boxed()); + Self { + writer: None, + task, + options, + fields, + offset: 0, + schema, + dictionary_tracker: DictionaryTracker { + dictionaries: Default::default(), + cannot_replace: true, + }, + record_blocks: vec![], + dictionary_blocks: vec![], + } + } + + async fn start(mut writer: W, encoded: EncodedData) -> Result> { + writer.write_all(&ARROW_MAGIC_V2[..]).await?; + writer.write_all(&[0, 0]).await?; + let (meta, data) = write_message(&mut writer, encoded).await?; + + Ok((meta + data + 8, None, vec![], Some(writer))) + } + + async fn write( + mut writer: W, + mut offset: usize, + record: EncodedData, + dictionaries: Vec, + ) -> Result> { + let mut dict_blocks = vec![]; + for dict in dictionaries { + let (meta, data) = write_message(&mut writer, dict).await?; + let block = Block { + offset: offset as i64, + meta_data_length: meta as i32, + body_length: data as i64, + }; + dict_blocks.push(block); + offset += meta + data; + } + let (meta, data) = write_message(&mut writer, record).await?; + let block = Block { + offset: offset as i64, + meta_data_length: meta as i32, + body_length: data as i64, + }; + offset += meta + data; + Ok((offset, Some(block), dict_blocks, Some(writer))) + } + + async fn finish(mut writer: W, footer: Footer) -> Result> { + write_continuation(&mut writer, 0).await?; + let footer = { + let mut builder = Builder::new(); + builder.finish(&footer, None).to_owned() + }; + writer.write_all(&footer[..]).await?; + writer + .write_all(&(footer.len() as i32).to_le_bytes()) + .await?; + writer.write_all(&ARROW_MAGIC_V2).await?; + writer.close().await?; + + Ok((0, None, vec![], None)) + } + + fn poll_write(&mut self, cx: &mut std::task::Context<'_>) -> Poll> { + if let Some(task) = &mut self.task { + match futures::ready!(task.poll_unpin(cx)) { + Ok((offset, record, mut dictionaries, writer)) => { + self.task = None; + self.writer = writer; + self.offset = offset; + if let Some(block) = record { + self.record_blocks.push(block); + } + self.dictionary_blocks.append(&mut dictionaries); + Poll::Ready(Ok(())) + }, + Err(error) => { + self.task = None; + Poll::Ready(Err(error)) + }, + } + } else { + Poll::Ready(Ok(())) + } + } +} + +impl<'a, W> Sink> for FileSink<'a, W> +where + W: AsyncWrite + Unpin + Send + 'a, +{ + type Error = Error; + + fn poll_ready( + self: std::pin::Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + self.get_mut().poll_write(cx) + } + + fn start_send(self: std::pin::Pin<&mut Self>, item: Record<'_>) -> Result<()> { + let this = self.get_mut(); + + if let Some(writer) = this.writer.take() { + let fields = item.fields().unwrap_or_else(|| &this.fields[..]); + + let (dictionaries, record) = encode_chunk( + item.columns(), + fields, + &mut this.dictionary_tracker, + &this.options, + )?; + + this.task = Some(Self::write(writer, this.offset, record, dictionaries).boxed()); + Ok(()) + } else { + Err(Error::Io(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "writer is closed", + ))) + } + } + + fn poll_flush( + self: std::pin::Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + self.get_mut().poll_write(cx) + } + + fn poll_close( + self: std::pin::Pin<&mut Self>, 
+ cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + let this = self.get_mut(); + match futures::ready!(this.poll_write(cx)) { + Ok(()) => { + if let Some(writer) = this.writer.take() { + let schema = serialize_schema(&this.schema, &this.fields); + let footer = Footer { + version: MetadataVersion::V5, + schema: Some(Box::new(schema)), + dictionaries: Some(std::mem::take(&mut this.dictionary_blocks)), + record_batches: Some(std::mem::take(&mut this.record_blocks)), + custom_metadata: None, + }; + this.task = Some(Self::finish(writer, footer).boxed()); + this.poll_write(cx) + } else { + Poll::Ready(Ok(())) + } + }, + Err(error) => Poll::Ready(Err(error)), + } + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/mod.rs b/crates/nano-arrow/src/io/ipc/write/mod.rs new file mode 100644 index 000000000000..55672a85da3c --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/mod.rs @@ -0,0 +1,70 @@ +//! APIs to write to Arrow's IPC format. +pub(crate) mod common; +mod schema; +mod serialize; +mod stream; +pub(crate) mod writer; + +pub use common::{Compression, Record, WriteOptions}; +pub use schema::schema_to_bytes; +pub use serialize::write; +use serialize::write_dictionary; +pub use stream::StreamWriter; +pub use writer::FileWriter; + +pub(crate) mod common_sync; + +#[cfg(feature = "io_ipc_write_async")] +mod common_async; +#[cfg(feature = "io_ipc_write_async")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_write_async")))] +pub mod stream_async; + +#[cfg(feature = "io_ipc_write_async")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc_write_async")))] +pub mod file_async; + +use super::IpcField; +use crate::datatypes::{DataType, Field}; + +fn default_ipc_field(data_type: &DataType, current_id: &mut i64) -> IpcField { + use crate::datatypes::DataType::*; + match data_type.to_logical_type() { + // single child => recurse + Map(inner, ..) | FixedSizeList(inner, _) | LargeList(inner) | List(inner) => IpcField { + fields: vec![default_ipc_field(inner.data_type(), current_id)], + dictionary_id: None, + }, + // multiple children => recurse + Union(fields, ..) | Struct(fields) => IpcField { + fields: fields + .iter() + .map(|f| default_ipc_field(f.data_type(), current_id)) + .collect(), + dictionary_id: None, + }, + // dictionary => current_id + Dictionary(_, data_type, _) => { + let dictionary_id = Some(*current_id); + *current_id += 1; + IpcField { + fields: vec![default_ipc_field(data_type, current_id)], + dictionary_id, + } + }, + // no children => do nothing + _ => IpcField { + fields: vec![], + dictionary_id: None, + }, + } +} + +/// Assigns every dictionary field a unique ID +pub fn default_ipc_fields(fields: &[Field]) -> Vec { + let mut dictionary_id = 0i64; + fields + .iter() + .map(|field| default_ipc_field(field.data_type().to_logical_type(), &mut dictionary_id)) + .collect() +} diff --git a/crates/nano-arrow/src/io/ipc/write/schema.rs b/crates/nano-arrow/src/io/ipc/write/schema.rs new file mode 100644 index 000000000000..dd6f44bbd33a --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/schema.rs @@ -0,0 +1,333 @@ +use arrow_format::ipc::planus::Builder; + +use super::super::IpcField; +use crate::datatypes::{ + DataType, Field, IntegerType, IntervalUnit, Metadata, Schema, TimeUnit, UnionMode, +}; +use crate::io::ipc::endianness::is_native_little_endian; + +/// Converts a [Schema] and [IpcField]s to a flatbuffers-encoded [arrow_format::ipc::Message]. 
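+///
+/// Schema messages carry no record batch body, so the emitted message has `body_length: 0`.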
+pub fn schema_to_bytes(schema: &Schema, ipc_fields: &[IpcField]) -> Vec { + let schema = serialize_schema(schema, ipc_fields); + + let message = arrow_format::ipc::Message { + version: arrow_format::ipc::MetadataVersion::V5, + header: Some(arrow_format::ipc::MessageHeader::Schema(Box::new(schema))), + body_length: 0, + custom_metadata: None, // todo: allow writing custom metadata + }; + let mut builder = Builder::new(); + let footer_data = builder.finish(&message, None); + footer_data.to_vec() +} + +pub fn serialize_schema(schema: &Schema, ipc_fields: &[IpcField]) -> arrow_format::ipc::Schema { + let endianness = if is_native_little_endian() { + arrow_format::ipc::Endianness::Little + } else { + arrow_format::ipc::Endianness::Big + }; + + let fields = schema + .fields + .iter() + .zip(ipc_fields.iter()) + .map(|(field, ipc_field)| serialize_field(field, ipc_field)) + .collect::>(); + + let mut custom_metadata = vec![]; + for (key, value) in &schema.metadata { + custom_metadata.push(arrow_format::ipc::KeyValue { + key: Some(key.clone()), + value: Some(value.clone()), + }); + } + let custom_metadata = if custom_metadata.is_empty() { + None + } else { + Some(custom_metadata) + }; + + arrow_format::ipc::Schema { + endianness, + fields: Some(fields), + custom_metadata, + features: None, // todo add this one + } +} + +fn write_metadata(metadata: &Metadata, kv_vec: &mut Vec) { + for (k, v) in metadata { + if k != "ARROW:extension:name" && k != "ARROW:extension:metadata" { + let entry = arrow_format::ipc::KeyValue { + key: Some(k.clone()), + value: Some(v.clone()), + }; + kv_vec.push(entry); + } + } +} + +fn write_extension( + name: &str, + metadata: &Option, + kv_vec: &mut Vec, +) { + // metadata + if let Some(metadata) = metadata { + let entry = arrow_format::ipc::KeyValue { + key: Some("ARROW:extension:metadata".to_string()), + value: Some(metadata.clone()), + }; + kv_vec.push(entry); + } + + // name + let entry = arrow_format::ipc::KeyValue { + key: Some("ARROW:extension:name".to_string()), + value: Some(name.to_string()), + }; + kv_vec.push(entry); +} + +/// Create an IPC Field from an Arrow Field +pub(crate) fn serialize_field(field: &Field, ipc_field: &IpcField) -> arrow_format::ipc::Field { + // custom metadata. 
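+    // Extension type information is encoded as `ARROW:extension:name` /
+    // `ARROW:extension:metadata` key-value pairs alongside the user-provided metadata.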
+ let mut kv_vec = vec![]; + if let DataType::Extension(name, _, metadata) = field.data_type() { + write_extension(name, metadata, &mut kv_vec); + } + + let type_ = serialize_type(field.data_type()); + let children = serialize_children(field.data_type(), ipc_field); + + let dictionary = if let DataType::Dictionary(index_type, inner, is_ordered) = field.data_type() + { + if let DataType::Extension(name, _, metadata) = inner.as_ref() { + write_extension(name, metadata, &mut kv_vec); + } + Some(serialize_dictionary( + index_type, + ipc_field + .dictionary_id + .expect("All Dictionary types have `dict_id`"), + *is_ordered, + )) + } else { + None + }; + + write_metadata(&field.metadata, &mut kv_vec); + + let custom_metadata = if !kv_vec.is_empty() { + Some(kv_vec) + } else { + None + }; + + arrow_format::ipc::Field { + name: Some(field.name.clone()), + nullable: field.is_nullable, + type_: Some(type_), + dictionary: dictionary.map(Box::new), + children: Some(children), + custom_metadata, + } +} + +fn serialize_time_unit(unit: &TimeUnit) -> arrow_format::ipc::TimeUnit { + match unit { + TimeUnit::Second => arrow_format::ipc::TimeUnit::Second, + TimeUnit::Millisecond => arrow_format::ipc::TimeUnit::Millisecond, + TimeUnit::Microsecond => arrow_format::ipc::TimeUnit::Microsecond, + TimeUnit::Nanosecond => arrow_format::ipc::TimeUnit::Nanosecond, + } +} + +fn serialize_type(data_type: &DataType) -> arrow_format::ipc::Type { + use arrow_format::ipc; + use DataType::*; + match data_type { + Null => ipc::Type::Null(Box::new(ipc::Null {})), + Boolean => ipc::Type::Bool(Box::new(ipc::Bool {})), + UInt8 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 8, + is_signed: false, + })), + UInt16 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 16, + is_signed: false, + })), + UInt32 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 32, + is_signed: false, + })), + UInt64 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 64, + is_signed: false, + })), + Int8 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 8, + is_signed: true, + })), + Int16 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 16, + is_signed: true, + })), + Int32 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 32, + is_signed: true, + })), + Int64 => ipc::Type::Int(Box::new(ipc::Int { + bit_width: 64, + is_signed: true, + })), + Float16 => ipc::Type::FloatingPoint(Box::new(ipc::FloatingPoint { + precision: ipc::Precision::Half, + })), + Float32 => ipc::Type::FloatingPoint(Box::new(ipc::FloatingPoint { + precision: ipc::Precision::Single, + })), + Float64 => ipc::Type::FloatingPoint(Box::new(ipc::FloatingPoint { + precision: ipc::Precision::Double, + })), + Decimal(precision, scale) => ipc::Type::Decimal(Box::new(ipc::Decimal { + precision: *precision as i32, + scale: *scale as i32, + bit_width: 128, + })), + Decimal256(precision, scale) => ipc::Type::Decimal(Box::new(ipc::Decimal { + precision: *precision as i32, + scale: *scale as i32, + bit_width: 256, + })), + Binary => ipc::Type::Binary(Box::new(ipc::Binary {})), + LargeBinary => ipc::Type::LargeBinary(Box::new(ipc::LargeBinary {})), + Utf8 => ipc::Type::Utf8(Box::new(ipc::Utf8 {})), + LargeUtf8 => ipc::Type::LargeUtf8(Box::new(ipc::LargeUtf8 {})), + FixedSizeBinary(size) => ipc::Type::FixedSizeBinary(Box::new(ipc::FixedSizeBinary { + byte_width: *size as i32, + })), + Date32 => ipc::Type::Date(Box::new(ipc::Date { + unit: ipc::DateUnit::Day, + })), + Date64 => ipc::Type::Date(Box::new(ipc::Date { + unit: ipc::DateUnit::Millisecond, + })), + Duration(unit) => 
ipc::Type::Duration(Box::new(ipc::Duration { + unit: serialize_time_unit(unit), + })), + Time32(unit) => ipc::Type::Time(Box::new(ipc::Time { + unit: serialize_time_unit(unit), + bit_width: 32, + })), + Time64(unit) => ipc::Type::Time(Box::new(ipc::Time { + unit: serialize_time_unit(unit), + bit_width: 64, + })), + Timestamp(unit, tz) => ipc::Type::Timestamp(Box::new(ipc::Timestamp { + unit: serialize_time_unit(unit), + timezone: tz.as_ref().cloned(), + })), + Interval(unit) => ipc::Type::Interval(Box::new(ipc::Interval { + unit: match unit { + IntervalUnit::YearMonth => ipc::IntervalUnit::YearMonth, + IntervalUnit::DayTime => ipc::IntervalUnit::DayTime, + IntervalUnit::MonthDayNano => ipc::IntervalUnit::MonthDayNano, + }, + })), + List(_) => ipc::Type::List(Box::new(ipc::List {})), + LargeList(_) => ipc::Type::LargeList(Box::new(ipc::LargeList {})), + FixedSizeList(_, size) => ipc::Type::FixedSizeList(Box::new(ipc::FixedSizeList { + list_size: *size as i32, + })), + Union(_, type_ids, mode) => ipc::Type::Union(Box::new(ipc::Union { + mode: match mode { + UnionMode::Dense => ipc::UnionMode::Dense, + UnionMode::Sparse => ipc::UnionMode::Sparse, + }, + type_ids: type_ids.clone(), + })), + Map(_, keys_sorted) => ipc::Type::Map(Box::new(ipc::Map { + keys_sorted: *keys_sorted, + })), + Struct(_) => ipc::Type::Struct(Box::new(ipc::Struct {})), + Dictionary(_, v, _) => serialize_type(v), + Extension(_, v, _) => serialize_type(v), + } +} + +fn serialize_children(data_type: &DataType, ipc_field: &IpcField) -> Vec { + use DataType::*; + match data_type { + Null + | Boolean + | Int8 + | Int16 + | Int32 + | Int64 + | UInt8 + | UInt16 + | UInt32 + | UInt64 + | Float16 + | Float32 + | Float64 + | Timestamp(_, _) + | Date32 + | Date64 + | Time32(_) + | Time64(_) + | Duration(_) + | Interval(_) + | Binary + | FixedSizeBinary(_) + | LargeBinary + | Utf8 + | LargeUtf8 + | Decimal(_, _) + | Decimal256(_, _) => vec![], + FixedSizeList(inner, _) | LargeList(inner) | List(inner) | Map(inner, _) => { + vec![serialize_field(inner, &ipc_field.fields[0])] + }, + Union(fields, _, _) | Struct(fields) => fields + .iter() + .zip(ipc_field.fields.iter()) + .map(|(field, ipc)| serialize_field(field, ipc)) + .collect(), + Dictionary(_, inner, _) => serialize_children(inner, ipc_field), + Extension(_, inner, _) => serialize_children(inner, ipc_field), + } +} + +/// Create an IPC dictionary encoding +pub(crate) fn serialize_dictionary( + index_type: &IntegerType, + dict_id: i64, + dict_is_ordered: bool, +) -> arrow_format::ipc::DictionaryEncoding { + use IntegerType::*; + let is_signed = match index_type { + Int8 | Int16 | Int32 | Int64 => true, + UInt8 | UInt16 | UInt32 | UInt64 => false, + }; + + let bit_width = match index_type { + Int8 | UInt8 => 8, + Int16 | UInt16 => 16, + Int32 | UInt32 => 32, + Int64 | UInt64 => 64, + }; + + let index_type = arrow_format::ipc::Int { + bit_width, + is_signed, + }; + + arrow_format::ipc::DictionaryEncoding { + id: dict_id, + index_type: Some(Box::new(index_type)), + is_ordered: dict_is_ordered, + dictionary_kind: arrow_format::ipc::DictionaryKind::DenseArray, + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/serialize.rs b/crates/nano-arrow/src/io/ipc/write/serialize.rs new file mode 100644 index 000000000000..f5bad22d6fe4 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/serialize.rs @@ -0,0 +1,763 @@ +#![allow(clippy::ptr_arg)] // false positive in clippy, see https://github.com/rust-lang/rust-clippy/issues/8463 +use arrow_format::ipc; + +use super::super::compression; 
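+// `compression` provides the LZ4/ZSTD helpers used below when a codec is requested.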
+use super::super::endianness::is_native_little_endian; +use super::common::{pad_to_64, Compression}; +use crate::array::*; +use crate::bitmap::Bitmap; +use crate::datatypes::PhysicalType; +use crate::offset::{Offset, OffsetsBuffer}; +use crate::trusted_len::TrustedLen; +use crate::types::NativeType; + +fn write_primitive( + array: &PrimitiveArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_bitmap( + array.validity(), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); + + write_buffer( + array.values(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ) +} + +fn write_boolean( + array: &BooleanArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + _: bool, + compression: Option, +) { + write_bitmap( + array.validity(), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); + write_bitmap( + Some(&array.values().clone()), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); +} + +#[allow(clippy::too_many_arguments)] +fn write_generic_binary( + validity: Option<&Bitmap>, + offsets: &OffsetsBuffer, + values: &[u8], + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + let offsets = offsets.buffer(); + write_bitmap( + validity, + offsets.len() - 1, + buffers, + arrow_data, + offset, + compression, + ); + + let first = *offsets.first().unwrap(); + let last = *offsets.last().unwrap(); + if first == O::default() { + write_buffer( + offsets, + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } else { + write_buffer_from_iter( + offsets.iter().map(|x| *x - first), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } + + write_bytes( + &values[first.to_usize()..last.to_usize()], + buffers, + arrow_data, + offset, + compression, + ); +} + +fn write_binary( + array: &BinaryArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_generic_binary( + array.validity(), + array.offsets(), + array.values(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); +} + +fn write_utf8( + array: &Utf8Array, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_generic_binary( + array.validity(), + array.offsets(), + array.values(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); +} + +fn write_fixed_size_binary( + array: &FixedSizeBinaryArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + _is_little_endian: bool, + compression: Option, +) { + write_bitmap( + array.validity(), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); + write_bytes(array.values(), buffers, arrow_data, offset, compression); +} + +fn write_list( + array: &ListArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + let offsets = array.offsets().buffer(); + let validity = array.validity(); + + write_bitmap( + validity, + offsets.len() - 1, + buffers, + arrow_data, + offset, + compression, + ); + + let first = *offsets.first().unwrap(); + let last = *offsets.last().unwrap(); + if first == O::zero() { + write_buffer( + offsets, + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } else { + 
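+        // The array was sliced: rebase the offsets so the first written offset is zero.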
write_buffer_from_iter( + offsets.iter().map(|x| *x - first), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } + + write( + array + .values() + .sliced(first.to_usize(), last.to_usize() - first.to_usize()) + .as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); +} + +pub fn write_struct( + array: &StructArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_bitmap( + array.validity(), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); + array.values().iter().for_each(|array| { + write( + array.as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); + }); +} + +pub fn write_union( + array: &UnionArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_buffer( + array.types(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + + if let Some(offsets) = array.offsets() { + write_buffer( + offsets, + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } + array.fields().iter().for_each(|array| { + write( + array.as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ) + }); +} + +fn write_map( + array: &MapArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + let offsets = array.offsets().buffer(); + let validity = array.validity(); + + write_bitmap( + validity, + offsets.len() - 1, + buffers, + arrow_data, + offset, + compression, + ); + + let first = *offsets.first().unwrap(); + let last = *offsets.last().unwrap(); + if first == 0 { + write_buffer( + offsets, + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } else { + write_buffer_from_iter( + offsets.iter().map(|x| *x - first), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + } + + write( + array + .field() + .sliced(first as usize, last as usize - first as usize) + .as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); +} + +fn write_fixed_size_list( + array: &FixedSizeListArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + write_bitmap( + array.validity(), + array.len(), + buffers, + arrow_data, + offset, + compression, + ); + write( + array.values().as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); +} + +// use `write_keys` to either write keys or values +#[allow(clippy::too_many_arguments)] +pub(super) fn write_dictionary( + array: &DictionaryArray, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, + write_keys: bool, +) -> usize { + if write_keys { + write_primitive( + array.keys(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ); + array.keys().len() + } else { + write( + array.values().as_ref(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); + array.values().len() + } +} + +/// Writes an [`Array`] to `arrow_data` +pub fn write( + array: &dyn Array, + buffers: &mut Vec, + arrow_data: &mut Vec, + nodes: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: 
Option, +) { + nodes.push(ipc::FieldNode { + length: array.len() as i64, + null_count: array.null_count() as i64, + }); + use PhysicalType::*; + match array.data_type().to_physical_type() { + Null => (), + Boolean => write_boolean( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let array = array.as_any().downcast_ref().unwrap(); + write_primitive::<$T>(array, buffers, arrow_data, offset, is_little_endian, compression) + }), + Binary => write_binary::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + LargeBinary => write_binary::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + FixedSizeBinary => write_fixed_size_binary( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + Utf8 => write_utf8::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + LargeUtf8 => write_utf8::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + offset, + is_little_endian, + compression, + ), + List => write_list::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ), + LargeList => write_list::( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ), + FixedSizeList => write_fixed_size_list( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ), + Struct => write_struct( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ), + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + write_dictionary::<$T>( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + true, + ); + }), + Union => { + write_union( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); + }, + Map => { + write_map( + array.as_any().downcast_ref().unwrap(), + buffers, + arrow_data, + nodes, + offset, + is_little_endian, + compression, + ); + }, + } +} + +#[inline] +fn pad_buffer_to_64(buffer: &mut Vec, length: usize) { + let pad_len = pad_to_64(length); + buffer.extend_from_slice(&vec![0u8; pad_len]); +} + +/// writes `bytes` to `arrow_data` updating `buffers` and `offset` and guaranteeing a 8 byte boundary. 
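+/// (Padding is applied via [`pad_to_64`], i.e. buffers are aligned to a 64-byte boundary.)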
+fn write_bytes( + bytes: &[u8], + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + compression: Option, +) { + let start = arrow_data.len(); + if let Some(compression) = compression { + arrow_data.extend_from_slice(&(bytes.len() as i64).to_le_bytes()); + match compression { + Compression::LZ4 => { + compression::compress_lz4(bytes, arrow_data).unwrap(); + }, + Compression::ZSTD => { + compression::compress_zstd(bytes, arrow_data).unwrap(); + }, + } + } else { + arrow_data.extend_from_slice(bytes); + }; + + buffers.push(finish_buffer(arrow_data, start, offset)); +} + +fn write_bitmap( + bitmap: Option<&Bitmap>, + length: usize, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + compression: Option, +) { + match bitmap { + Some(bitmap) => { + assert_eq!(bitmap.len(), length); + let (slice, slice_offset, _) = bitmap.as_slice(); + if slice_offset != 0 { + // case where we can't slice the bitmap as the offsets are not multiple of 8 + let bytes = Bitmap::from_trusted_len_iter(bitmap.iter()); + let (slice, _, _) = bytes.as_slice(); + write_bytes(slice, buffers, arrow_data, offset, compression) + } else { + write_bytes(slice, buffers, arrow_data, offset, compression) + } + }, + None => { + buffers.push(ipc::Buffer { + offset: *offset, + length: 0, + }); + }, + } +} + +/// writes `bytes` to `arrow_data` updating `buffers` and `offset` and guaranteeing a 8 byte boundary. +fn write_buffer( + buffer: &[T], + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + let start = arrow_data.len(); + if let Some(compression) = compression { + _write_compressed_buffer(buffer, arrow_data, is_little_endian, compression); + } else { + _write_buffer(buffer, arrow_data, is_little_endian); + }; + + buffers.push(finish_buffer(arrow_data, start, offset)); +} + +#[inline] +fn _write_buffer_from_iter>( + buffer: I, + arrow_data: &mut Vec, + is_little_endian: bool, +) { + let len = buffer.size_hint().0; + arrow_data.reserve(len * std::mem::size_of::()); + if is_little_endian { + buffer + .map(|x| T::to_le_bytes(&x)) + .for_each(|x| arrow_data.extend_from_slice(x.as_ref())) + } else { + buffer + .map(|x| T::to_be_bytes(&x)) + .for_each(|x| arrow_data.extend_from_slice(x.as_ref())) + } +} + +#[inline] +fn _write_compressed_buffer_from_iter>( + buffer: I, + arrow_data: &mut Vec, + is_little_endian: bool, + compression: Compression, +) { + let len = buffer.size_hint().0; + let mut swapped = Vec::with_capacity(len * std::mem::size_of::()); + if is_little_endian { + buffer + .map(|x| T::to_le_bytes(&x)) + .for_each(|x| swapped.extend_from_slice(x.as_ref())); + } else { + buffer + .map(|x| T::to_be_bytes(&x)) + .for_each(|x| swapped.extend_from_slice(x.as_ref())) + }; + arrow_data.extend_from_slice(&(swapped.len() as i64).to_le_bytes()); + match compression { + Compression::LZ4 => { + compression::compress_lz4(&swapped, arrow_data).unwrap(); + }, + Compression::ZSTD => { + compression::compress_zstd(&swapped, arrow_data).unwrap(); + }, + } +} + +fn _write_buffer(buffer: &[T], arrow_data: &mut Vec, is_little_endian: bool) { + if is_little_endian == is_native_little_endian() { + // in native endianness we can use the bytes directly. 
+ let buffer = bytemuck::cast_slice(buffer); + arrow_data.extend_from_slice(buffer); + } else { + _write_buffer_from_iter(buffer.iter().copied(), arrow_data, is_little_endian) + } +} + +fn _write_compressed_buffer( + buffer: &[T], + arrow_data: &mut Vec, + is_little_endian: bool, + compression: Compression, +) { + if is_little_endian == is_native_little_endian() { + let bytes = bytemuck::cast_slice(buffer); + arrow_data.extend_from_slice(&(bytes.len() as i64).to_le_bytes()); + match compression { + Compression::LZ4 => { + compression::compress_lz4(bytes, arrow_data).unwrap(); + }, + Compression::ZSTD => { + compression::compress_zstd(bytes, arrow_data).unwrap(); + }, + } + } else { + todo!() + } +} + +/// writes `bytes` to `arrow_data` updating `buffers` and `offset` and guaranteeing a 8 byte boundary. +#[inline] +fn write_buffer_from_iter>( + buffer: I, + buffers: &mut Vec, + arrow_data: &mut Vec, + offset: &mut i64, + is_little_endian: bool, + compression: Option, +) { + let start = arrow_data.len(); + + if let Some(compression) = compression { + _write_compressed_buffer_from_iter(buffer, arrow_data, is_little_endian, compression); + } else { + _write_buffer_from_iter(buffer, arrow_data, is_little_endian); + } + + buffers.push(finish_buffer(arrow_data, start, offset)); +} + +fn finish_buffer(arrow_data: &mut Vec, start: usize, offset: &mut i64) -> ipc::Buffer { + let buffer_len = (arrow_data.len() - start) as i64; + + pad_buffer_to_64(arrow_data, arrow_data.len() - start); + let total_len = (arrow_data.len() - start) as i64; + + let buffer = ipc::Buffer { + offset: *offset, + length: buffer_len, + }; + *offset += total_len; + buffer +} diff --git a/crates/nano-arrow/src/io/ipc/write/stream.rs b/crates/nano-arrow/src/io/ipc/write/stream.rs new file mode 100644 index 000000000000..3fe7e143e02d --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/stream.rs @@ -0,0 +1,113 @@ +//! Arrow IPC File and Stream Writers +//! +//! The `FileWriter` and `StreamWriter` have similar interfaces, +//! however the `FileWriter` expects a reader that supports `Seek`ing + +use std::io::Write; + +use super::super::IpcField; +use super::common::{encode_chunk, DictionaryTracker, EncodedData, WriteOptions}; +use super::common_sync::{write_continuation, write_message}; +use super::{default_ipc_fields, schema_to_bytes}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::*; +use crate::error::{Error, Result}; + +/// Arrow stream writer +/// +/// The data written by this writer must be read in order. To signal that no more +/// data is arriving through the stream call [`self.finish()`](StreamWriter::finish); +/// +/// For a usage walkthrough consult [this example](https://github.com/jorgecarleitao/arrow2/tree/main/examples/ipc_pyarrow). +pub struct StreamWriter { + /// The object to write to + writer: W, + /// IPC write options + write_options: WriteOptions, + /// Whether the stream has been finished + finished: bool, + /// Keeps track of dictionaries that have been written + dictionary_tracker: DictionaryTracker, + + ipc_fields: Option>, +} + +impl StreamWriter { + /// Creates a new [`StreamWriter`] + pub fn new(writer: W, write_options: WriteOptions) -> Self { + Self { + writer, + write_options, + finished: false, + dictionary_tracker: DictionaryTracker { + dictionaries: Default::default(), + cannot_replace: false, + }, + ipc_fields: None, + } + } + + /// Starts the stream by writing a Schema message to it. 
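+    ///
+    /// A typical sequence is `new`, then `start`, then one or more `write` calls, then `finish`.
+    /// A minimal sketch (assuming a `schema` and a `chunk` are in scope):
+    ///
+    /// ```ignore
+    /// let mut writer = StreamWriter::new(vec![], WriteOptions { compression: None });
+    /// writer.start(&schema, None)?;
+    /// writer.write(&chunk, None)?;
+    /// writer.finish()?;
+    /// let bytes: Vec<u8> = writer.into_inner();
+    /// ```
+    ///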
+ /// Use `ipc_fields` to declare dictionary ids in the schema, for dictionary-reuse + pub fn start(&mut self, schema: &Schema, ipc_fields: Option>) -> Result<()> { + self.ipc_fields = Some(if let Some(ipc_fields) = ipc_fields { + ipc_fields + } else { + default_ipc_fields(&schema.fields) + }); + + let encoded_message = EncodedData { + ipc_message: schema_to_bytes(schema, self.ipc_fields.as_ref().unwrap()), + arrow_data: vec![], + }; + write_message(&mut self.writer, &encoded_message)?; + Ok(()) + } + + /// Writes [`Chunk`] to the stream + pub fn write( + &mut self, + columns: &Chunk>, + ipc_fields: Option<&[IpcField]>, + ) -> Result<()> { + if self.finished { + return Err(Error::Io(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "Cannot write to a finished stream".to_string(), + ))); + } + + // we can't make it a closure because it borrows (and it can't borrow mut and non-mut below) + #[allow(clippy::or_fun_call)] + let fields = ipc_fields.unwrap_or(self.ipc_fields.as_ref().unwrap()); + + let (encoded_dictionaries, encoded_message) = encode_chunk( + columns, + fields, + &mut self.dictionary_tracker, + &self.write_options, + )?; + + for encoded_dictionary in encoded_dictionaries { + write_message(&mut self.writer, &encoded_dictionary)?; + } + + write_message(&mut self.writer, &encoded_message)?; + Ok(()) + } + + /// Write continuation bytes, and mark the stream as done + pub fn finish(&mut self) -> Result<()> { + write_continuation(&mut self.writer, 0)?; + + self.finished = true; + + Ok(()) + } + + /// Consumes itself, returning the inner writer. + pub fn into_inner(self) -> W { + self.writer + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/stream_async.rs b/crates/nano-arrow/src/io/ipc/write/stream_async.rs new file mode 100644 index 000000000000..7af62682935a --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/stream_async.rs @@ -0,0 +1,188 @@ +//! `async` writing of arrow streams + +use std::pin::Pin; +use std::task::Poll; + +use futures::future::BoxFuture; +use futures::{AsyncWrite, AsyncWriteExt, FutureExt, Sink}; + +use super::super::IpcField; +pub use super::common::WriteOptions; +use super::common::{encode_chunk, DictionaryTracker, EncodedData}; +use super::common_async::{write_continuation, write_message}; +use super::{default_ipc_fields, schema_to_bytes, Record}; +use crate::datatypes::*; +use crate::error::{Error, Result}; + +/// A sink that writes array [`chunks`](crate::chunk::Chunk) as an IPC stream. +/// +/// The stream header is automatically written before writing the first chunk. 
+/// +/// # Examples +/// +/// ``` +/// use futures::SinkExt; +/// use arrow2::array::{Array, Int32Array}; +/// use arrow2::datatypes::{DataType, Field, Schema}; +/// use arrow2::chunk::Chunk; +/// # use arrow2::io::ipc::write::stream_async::StreamSink; +/// # futures::executor::block_on(async move { +/// let schema = Schema::from(vec![ +/// Field::new("values", DataType::Int32, true), +/// ]); +/// +/// let mut buffer = vec![]; +/// let mut sink = StreamSink::new( +/// &mut buffer, +/// &schema, +/// None, +/// Default::default(), +/// ); +/// +/// for i in 0..3 { +/// let values = Int32Array::from(&[Some(i), None]); +/// let chunk = Chunk::new(vec![values.boxed()]); +/// sink.feed(chunk.into()).await?; +/// } +/// sink.close().await?; +/// # arrow2::error::Result::Ok(()) +/// # }).unwrap(); +/// ``` +pub struct StreamSink<'a, W: AsyncWrite + Unpin + Send + 'a> { + writer: Option, + task: Option>>>, + options: WriteOptions, + dictionary_tracker: DictionaryTracker, + fields: Vec, +} + +impl<'a, W> StreamSink<'a, W> +where + W: AsyncWrite + Unpin + Send + 'a, +{ + /// Create a new [`StreamSink`]. + pub fn new( + writer: W, + schema: &Schema, + ipc_fields: Option>, + write_options: WriteOptions, + ) -> Self { + let fields = ipc_fields.unwrap_or_else(|| default_ipc_fields(&schema.fields)); + let task = Some(Self::start(writer, schema, &fields[..])); + Self { + writer: None, + task, + fields, + dictionary_tracker: DictionaryTracker { + dictionaries: Default::default(), + cannot_replace: false, + }, + options: write_options, + } + } + + fn start( + mut writer: W, + schema: &Schema, + ipc_fields: &[IpcField], + ) -> BoxFuture<'a, Result>> { + let message = EncodedData { + ipc_message: schema_to_bytes(schema, ipc_fields), + arrow_data: vec![], + }; + async move { + write_message(&mut writer, message).await?; + Ok(Some(writer)) + } + .boxed() + } + + fn write(&mut self, record: Record<'_>) -> Result<()> { + let fields = record.fields().unwrap_or(&self.fields[..]); + let (dictionaries, message) = encode_chunk( + record.columns(), + fields, + &mut self.dictionary_tracker, + &self.options, + )?; + + if let Some(mut writer) = self.writer.take() { + self.task = Some( + async move { + for d in dictionaries { + write_message(&mut writer, d).await?; + } + write_message(&mut writer, message).await?; + Ok(Some(writer)) + } + .boxed(), + ); + Ok(()) + } else { + Err(Error::Io(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "writer closed".to_string(), + ))) + } + } + + fn poll_complete(&mut self, cx: &mut std::task::Context<'_>) -> Poll> { + if let Some(task) = &mut self.task { + match futures::ready!(task.poll_unpin(cx)) { + Ok(writer) => { + self.writer = writer; + self.task = None; + Poll::Ready(Ok(())) + }, + Err(error) => { + self.task = None; + Poll::Ready(Err(error)) + }, + } + } else { + Poll::Ready(Ok(())) + } + } +} + +impl<'a, W> Sink> for StreamSink<'a, W> +where + W: AsyncWrite + Unpin + Send, +{ + type Error = Error; + + fn poll_ready(self: Pin<&mut Self>, cx: &mut std::task::Context<'_>) -> Poll> { + self.get_mut().poll_complete(cx) + } + + fn start_send(self: Pin<&mut Self>, item: Record<'_>) -> Result<()> { + self.get_mut().write(item) + } + + fn poll_flush(self: Pin<&mut Self>, cx: &mut std::task::Context<'_>) -> Poll> { + self.get_mut().poll_complete(cx) + } + + fn poll_close(self: Pin<&mut Self>, cx: &mut std::task::Context<'_>) -> Poll> { + let this = self.get_mut(); + match this.poll_complete(cx) { + Poll::Ready(Ok(())) => { + if let Some(mut writer) = this.writer.take() { + 
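                    // any pending task has completed; queue one final task that writes the
                    // end-of-stream continuation marker, then flushes and closes the writer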
this.task = Some( + async move { + write_continuation(&mut writer, 0).await?; + writer.flush().await?; + writer.close().await?; + Ok(None) + } + .boxed(), + ); + this.poll_complete(cx) + } else { + Poll::Ready(Ok(())) + } + }, + res => res, + } + } +} diff --git a/crates/nano-arrow/src/io/ipc/write/writer.rs b/crates/nano-arrow/src/io/ipc/write/writer.rs new file mode 100644 index 000000000000..8fcdd2a8bd66 --- /dev/null +++ b/crates/nano-arrow/src/io/ipc/write/writer.rs @@ -0,0 +1,210 @@ +use std::io::Write; + +use arrow_format::ipc::planus::Builder; + +use super::super::{IpcField, ARROW_MAGIC_V2}; +use super::common::{DictionaryTracker, EncodedData, WriteOptions}; +use super::common_sync::{write_continuation, write_message}; +use super::{default_ipc_fields, schema, schema_to_bytes}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::io::ipc::write::common::encode_chunk_amortized; + +#[derive(Clone, Copy, PartialEq, Eq)] +pub(crate) enum State { + None, + Started, + Finished, +} + +/// Arrow file writer +pub struct FileWriter { + /// The object to write to + pub(crate) writer: W, + /// IPC write options + pub(crate) options: WriteOptions, + /// A reference to the schema, used in validating record batches + pub(crate) schema: Schema, + pub(crate) ipc_fields: Vec, + /// The number of bytes between each block of bytes, as an offset for random access + pub(crate) block_offsets: usize, + /// Dictionary blocks that will be written as part of the IPC footer + pub(crate) dictionary_blocks: Vec, + /// Record blocks that will be written as part of the IPC footer + pub(crate) record_blocks: Vec, + /// Whether the writer footer has been written, and the writer is finished + pub(crate) state: State, + /// Keeps track of dictionaries that have been written + pub(crate) dictionary_tracker: DictionaryTracker, + /// Buffer/scratch that is reused between writes + pub(crate) encoded_message: EncodedData, +} + +impl FileWriter { + /// Creates a new [`FileWriter`] and writes the header to `writer` + pub fn try_new( + writer: W, + schema: Schema, + ipc_fields: Option>, + options: WriteOptions, + ) -> Result { + let mut slf = Self::new(writer, schema, ipc_fields, options); + slf.start()?; + + Ok(slf) + } + + /// Creates a new [`FileWriter`]. + pub fn new( + writer: W, + schema: Schema, + ipc_fields: Option>, + options: WriteOptions, + ) -> Self { + let ipc_fields = if let Some(ipc_fields) = ipc_fields { + ipc_fields + } else { + default_ipc_fields(&schema.fields) + }; + + Self { + writer, + options, + schema, + ipc_fields, + block_offsets: 0, + dictionary_blocks: vec![], + record_blocks: vec![], + state: State::None, + dictionary_tracker: DictionaryTracker { + dictionaries: Default::default(), + cannot_replace: true, + }, + encoded_message: Default::default(), + } + } + + /// Consumes itself into the inner writer + pub fn into_inner(self) -> W { + self.writer + } + + /// Get the inner memory scratches so they can be reused in a new writer. + /// This can be utilized to save memory allocations for performance reasons. + pub fn get_scratches(&mut self) -> EncodedData { + std::mem::take(&mut self.encoded_message) + } + /// Set the inner memory scratches so they can be reused in a new writer. + /// This can be utilized to save memory allocations for performance reasons. + pub fn set_scratches(&mut self, scratches: EncodedData) { + self.encoded_message = scratches; + } + + /// Writes the header and first (schema) message to the file. 
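    /// The header is the 6-byte `ARROW1` magic plus two padding bytes, so that the schema
    /// message that follows starts at an 8-byte boundary.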
+ /// # Errors + /// Errors if the file has been started or has finished. + pub fn start(&mut self) -> Result<()> { + if self.state != State::None { + return Err(Error::oos("The IPC file can only be started once")); + } + // write magic to header + self.writer.write_all(&ARROW_MAGIC_V2[..])?; + // create an 8-byte boundary after the header + self.writer.write_all(&[0, 0])?; + // write the schema, set the written bytes to the schema + + let encoded_message = EncodedData { + ipc_message: schema_to_bytes(&self.schema, &self.ipc_fields), + arrow_data: vec![], + }; + + let (meta, data) = write_message(&mut self.writer, &encoded_message)?; + self.block_offsets += meta + data + 8; // 8 <=> arrow magic + 2 bytes for alignment + self.state = State::Started; + Ok(()) + } + + /// Writes [`Chunk`] to the file + pub fn write( + &mut self, + chunk: &Chunk>, + ipc_fields: Option<&[IpcField]>, + ) -> Result<()> { + if self.state != State::Started { + return Err(Error::oos( + "The IPC file must be started before it can be written to. Call `start` before `write`", + )); + } + + let ipc_fields = if let Some(ipc_fields) = ipc_fields { + ipc_fields + } else { + self.ipc_fields.as_ref() + }; + let encoded_dictionaries = encode_chunk_amortized( + chunk, + ipc_fields, + &mut self.dictionary_tracker, + &self.options, + &mut self.encoded_message, + )?; + + // add all dictionaries + for encoded_dictionary in encoded_dictionaries { + let (meta, data) = write_message(&mut self.writer, &encoded_dictionary)?; + + let block = arrow_format::ipc::Block { + offset: self.block_offsets as i64, + meta_data_length: meta as i32, + body_length: data as i64, + }; + self.dictionary_blocks.push(block); + self.block_offsets += meta + data; + } + + let (meta, data) = write_message(&mut self.writer, &self.encoded_message)?; + // add a record block for the footer + let block = arrow_format::ipc::Block { + offset: self.block_offsets as i64, + meta_data_length: meta as i32, // TODO: is this still applicable? + body_length: data as i64, + }; + self.record_blocks.push(block); + self.block_offsets += meta + data; + Ok(()) + } + + /// Write footer and closing tag, then mark the writer as done + pub fn finish(&mut self) -> Result<()> { + if self.state != State::Started { + return Err(Error::oos( + "The IPC file must be started before it can be finished. Call `start` before `finish`", + )); + } + + // write EOS + write_continuation(&mut self.writer, 0)?; + + let schema = schema::serialize_schema(&self.schema, &self.ipc_fields); + + let root = arrow_format::ipc::Footer { + version: arrow_format::ipc::MetadataVersion::V5, + schema: Some(Box::new(schema)), + dictionaries: Some(std::mem::take(&mut self.dictionary_blocks)), + record_batches: Some(std::mem::take(&mut self.record_blocks)), + custom_metadata: None, + }; + let mut builder = Builder::new(); + let footer_data = builder.finish(&root, None); + self.writer.write_all(footer_data)?; + self.writer + .write_all(&(footer_data.len() as i32).to_le_bytes())?; + self.writer.write_all(&ARROW_MAGIC_V2)?; + self.writer.flush()?; + self.state = State::Finished; + + Ok(()) + } +} diff --git a/crates/nano-arrow/src/io/iterator.rs b/crates/nano-arrow/src/io/iterator.rs new file mode 100644 index 000000000000..91ec86fc2e04 --- /dev/null +++ b/crates/nano-arrow/src/io/iterator.rs @@ -0,0 +1,65 @@ +pub use streaming_iterator::StreamingIterator; + +/// A [`StreamingIterator`] with an internal buffer of [`Vec`] used to efficiently +/// present items of type `T` as `&[u8]`. 
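/// The internal buffer is cleared and re-filled on each call to `advance`, avoiding one
/// allocation per item.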
+/// It is generic over the type `T` and the transformation `F: T -> &[u8]`. +pub struct BufStreamingIterator +where + I: Iterator, + F: FnMut(T, &mut Vec), +{ + iterator: I, + f: F, + buffer: Vec, + is_valid: bool, +} + +impl BufStreamingIterator +where + I: Iterator, + F: FnMut(T, &mut Vec), +{ + #[inline] + pub fn new(iterator: I, f: F, buffer: Vec) -> Self { + Self { + iterator, + f, + buffer, + is_valid: false, + } + } +} + +impl StreamingIterator for BufStreamingIterator +where + I: Iterator, + F: FnMut(T, &mut Vec), +{ + type Item = [u8]; + + #[inline] + fn advance(&mut self) { + let a = self.iterator.next(); + if let Some(a) = a { + self.is_valid = true; + self.buffer.clear(); + (self.f)(a, &mut self.buffer); + } else { + self.is_valid = false; + } + } + + #[inline] + fn get(&self) -> Option<&Self::Item> { + if self.is_valid { + Some(&self.buffer) + } else { + None + } + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + self.iterator.size_hint() + } +} diff --git a/crates/nano-arrow/src/io/mod.rs b/crates/nano-arrow/src/io/mod.rs new file mode 100644 index 000000000000..72bf37ba9ea5 --- /dev/null +++ b/crates/nano-arrow/src/io/mod.rs @@ -0,0 +1,21 @@ +#![forbid(unsafe_code)] +//! Contains modules to interface with other formats such as [`csv`], +//! [`parquet`], [`json`], [`ipc`], [`mod@print`] and [`avro`]. + +#[cfg(feature = "io_ipc")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc")))] +pub mod ipc; + +#[cfg(feature = "io_flight")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_flight")))] +pub mod flight; + +#[cfg(feature = "io_parquet")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_parquet")))] +pub mod parquet; + +#[cfg(feature = "io_avro")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_avro")))] +pub mod avro; + +pub mod iterator; diff --git a/crates/nano-arrow/src/io/parquet/mod.rs b/crates/nano-arrow/src/io/parquet/mod.rs new file mode 100644 index 000000000000..04e5693fcfe6 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/mod.rs @@ -0,0 +1,31 @@ +//! APIs to read from and write to Parquet format. +use crate::error::Error; + +pub mod read; +pub mod write; + +#[cfg(feature = "io_parquet_bloom_filter")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_parquet_bloom_filter")))] +pub use parquet2::bloom_filter; + +const ARROW_SCHEMA_META_KEY: &str = "ARROW:schema"; + +impl From for Error { + fn from(error: parquet2::error::Error) -> Self { + match error { + parquet2::error::Error::FeatureNotActive(_, _) => { + let message = "Failed to read a compressed parquet file. \ + Use the cargo feature \"io_parquet_compression\" to read compressed parquet files." + .to_string(); + Error::ExternalFormat(message) + }, + _ => Error::ExternalFormat(error.to_string()), + } + } +} + +impl From for parquet2::error::Error { + fn from(error: Error) -> Self { + parquet2::error::Error::OutOfSpec(error.to_string()) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/README.md b/crates/nano-arrow/src/io/parquet/read/README.md new file mode 100644 index 000000000000..c36aaafaf79a --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/README.md @@ -0,0 +1,36 @@ +## Observations + +### LSB equivalence between definition levels and bitmaps + +When the maximum repetition level is 0 and the maximum definition level is 1, +the RLE-encoded definition levels correspond exactly to Arrow's bitmap and can be +memcopied without further transformations. 
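To see why, consider an optional, non-nested column (maximum repetition level 0, maximum definition level 1): each definition level is either 0 (null) or 1 (present), and packing those levels LSB-first is exactly Arrow's validity bitmap layout. The snippet below is a minimal, self-contained illustration of that equivalence; the helper name is ours and not an API of this crate, and the actual reader memcopies the bit-packed runs instead of re-packing them.

```rust
/// Illustrative helper (not part of this crate): pack 0/1 definition levels
/// LSB-first, which is byte-for-byte Arrow's validity bitmap layout.
fn def_levels_to_validity(def_levels: &[u8]) -> Vec<u8> {
    let mut bitmap = vec![0u8; (def_levels.len() + 7) / 8];
    for (i, &level) in def_levels.iter().enumerate() {
        // max def level == 1, so 1 means "value present" and 0 means "null"
        if level == 1 {
            bitmap[i / 8] |= 1u8 << (i % 8);
        }
    }
    bitmap
}

fn main() {
    // column values: [Some, None, Some, Some, None]
    let def_levels = [1u8, 0, 1, 1, 0];
    // bits 0, 2 and 3 are set (LSB-first) == 0b0000_1101
    assert_eq!(def_levels_to_validity(&def_levels), vec![0b0000_1101u8]);
}
```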
## Nested parquet groups are deserialized recursively

Reading a nested parquet field is done by reading each primitive
column sequentially and building the nested structure recursively.

Rows of nested parquet groups are encoded in the repetition and definition levels.
In Arrow, they correspond to:

- list's offsets and validity
- struct's validity

The implementation in this module leverages this observation:

Nested parquet fields are initially recursed over to gather
whether the type is a Struct or List, and whether it is required or optional, which we store
in `nested_info: Vec<Box<dyn Nested>>`. `Nested` is a trait object that receives definition
and repetition levels depending on the type and nullability of the nested item.
We process the definition and repetition levels into `nested_info`.

When we finish a field, we recursively pop from `nested_info` as we build
the `StructArray` or `ListArray`.

With this approach, the only differences vs. the flat case are:

1. we do not leverage the bitmap optimization, and instead need to deserialize the repetition
   and definition levels to `i32`.
2. we deserialize definition levels twice, once to extend the values/nullability and
   once to extend `nested_info`.

diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/README.md b/crates/nano-arrow/src/io/parquet/read/deserialize/README.md new file mode 100644 index 000000000000..5b985bac8e9b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/README.md @@ -0,0 +1,71 @@

# Design

## Non-nested types

Let's start with the design used for non-nested arrays. The (private) entry point of this
module for non-nested arrays is `simple::page_iter_to_arrays`.

This function expects:

- a (fallible) streaming iterator of decompressed and encoded pages, `Pages`
- the source (parquet) column type, including its logical information
- the target (arrow) `DataType`
- the chunk size

and returns an iterator of `Array`, `ArrayIter`.

This design is shared among _all_ implemented `(parquet, arrow)` tuples. Their main
difference is how they are deserialized, which depends on the source and target types.

When the array iterator is pulled the first time, the following happens:

- a page from `Pages` is pulled
- a `PageState<'a>` is built from the page
- the `PageState` is consumed into a mutable array:
  - if `chunk_size` is larger than the number of rows in the page, the mutable array state is preserved, a new page is pulled, and the process is repeated until the chunk is filled.
  - if `chunk_size` is smaller than the number of rows in the page, the mutable array state
    is returned and the remainder of the page is consumed into multiple mutable arrays of length `chunk_size`, which are pushed onto a FIFO queue.

Subsequent pulls of arrays first try to pull from the FIFO queue. Once the queue is empty,
a new page is pulled.

### `PageState`

As mentioned above, the iterator leverages the idea that we attach a state to a page. Recall
that a page is essentially `[header][data]`. The `data` part contains encoded
`[rep levels][def levels][non-null values]`. Some pages have an associated dictionary page,
in which case the `non-null values` represent the indices.

Irrespective of the physical type, the main idea is to split the page into two iterators:

- An iterator over `def levels`
- An iterator over `non-null values`

and progress the iterators as needed.
In particular, for non-nested types, `def levels` is +a bitmap with the same representation as Arrow, in which case the validity is extended directly. + +The `non-null values` are "expanded" by filling null values with the default value of each physical +type. + +## Nested types + +For nested type with N+1 levels (1 is the primitive), we need to build the nest information of each +N levels + the non-nested Arrow array. + +This is done by first transversing the parquet types and using it to initialize, per chunk, the N levels. + +The per-chunk execution is then similar but `chunk_size` only drives the number of retrieved +rows from the outermost parquet group (the field). Each of these pulls knows how many items need +to be pulled from the inner groups, all the way to the primitive type. This works because +in parquet a row cannot be split between two pages and thus each page is guaranteed +to contain a full row. + +The `PageState` of nested types is composed by 4 iterators: + +- A (zipped) iterator over `rep levels` and `def levels` +- An iterator over `def levels` +- An iterator over `non-null values` + +The idea is that an iterator of `rep, def` contain all the information to decode the +nesting structure of an arrow array. The other two iterators are equivalent to the non-nested +types with the exception that `def levels` are no equivalent to arrow bitmaps. diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/binary/basic.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/basic.rs new file mode 100644 index 000000000000..6008dd9de005 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/basic.rs @@ -0,0 +1,516 @@ +use std::collections::VecDeque; +use std::default::Default; + +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::{delta_length_byte_array, hybrid_rle, Encoding}; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::utils::{ + extend_from_decoder, get_selected_rows, next, DecodedState, FilteredOptionalPageValidity, + MaybeNext, OptionalPageValidity, +}; +use super::super::{utils, Pages}; +use super::utils::*; +use crate::array::{Array, BinaryArray, Utf8Array}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::{Error, Result}; +use crate::offset::Offset; + +#[derive(Debug)] +pub(super) struct Required<'a> { + pub values: SizedBinaryIter<'a>, +} + +impl<'a> Required<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + let values = SizedBinaryIter::new(values, page.num_values()); + + Ok(Self { values }) + } + + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct Delta<'a> { + pub lengths: std::vec::IntoIter, + pub values: &'a [u8], +} + +impl<'a> Delta<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + + let mut lengths_iter = delta_length_byte_array::Decoder::try_new(values)?; + + #[allow(clippy::needless_collect)] // we need to consume it to get the values + let lengths = lengths_iter + .by_ref() + .map(|x| x.map(|x| x as usize).map_err(Error::from)) + .collect::>>()?; + + let values = lengths_iter.into_values(); + Ok(Self { + lengths: lengths.into_iter(), + values, + }) + } + + pub fn len(&self) -> usize { + self.lengths.size_hint().0 + } +} + +impl<'a> Iterator for Delta<'a> { + type Item = &'a [u8]; + + #[inline] + fn next(&mut self) -> Option { + let 
length = self.lengths.next()?; + let (item, remaining) = self.values.split_at(length); + self.values = remaining; + Some(item) + } + + fn size_hint(&self) -> (usize, Option) { + self.lengths.size_hint() + } +} + +#[derive(Debug)] +pub(super) struct FilteredRequired<'a> { + pub values: SliceFilteredIter>, +} + +impl<'a> FilteredRequired<'a> { + pub fn new(page: &'a DataPage) -> Self { + let values = SizedBinaryIter::new(page.buffer(), page.num_values()); + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Self { values } + } + + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct FilteredDelta<'a> { + pub values: SliceFilteredIter>, +} + +impl<'a> FilteredDelta<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let values = Delta::try_new(page)?; + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(Self { values }) + } + + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +pub(super) type Dict = Vec>; + +#[derive(Debug)] +pub(super) struct RequiredDictionary<'a> { + pub values: hybrid_rle::HybridRleDecoder<'a>, + pub dict: &'a Dict, +} + +impl<'a> RequiredDictionary<'a> { + pub fn try_new(page: &'a DataPage, dict: &'a Dict) -> Result { + let values = utils::dict_indices_decoder(page)?; + + Ok(Self { dict, values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct FilteredRequiredDictionary<'a> { + pub values: SliceFilteredIter>, + pub dict: &'a Dict, +} + +impl<'a> FilteredRequiredDictionary<'a> { + pub fn try_new(page: &'a DataPage, dict: &'a Dict) -> Result { + let values = utils::dict_indices_decoder(page)?; + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(Self { values, dict }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct ValuesDictionary<'a> { + pub values: hybrid_rle::HybridRleDecoder<'a>, + pub dict: &'a Dict, +} + +impl<'a> ValuesDictionary<'a> { + pub fn try_new(page: &'a DataPage, dict: &'a Dict) -> Result { + let values = utils::dict_indices_decoder(page)?; + + Ok(Self { dict, values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +enum State<'a> { + Optional(OptionalPageValidity<'a>, BinaryIter<'a>), + Required(Required<'a>), + RequiredDictionary(RequiredDictionary<'a>), + OptionalDictionary(OptionalPageValidity<'a>, ValuesDictionary<'a>), + Delta(Delta<'a>), + OptionalDelta(OptionalPageValidity<'a>, Delta<'a>), + FilteredRequired(FilteredRequired<'a>), + FilteredDelta(FilteredDelta<'a>), + FilteredOptionalDelta(FilteredOptionalPageValidity<'a>, Delta<'a>), + FilteredOptional(FilteredOptionalPageValidity<'a>, BinaryIter<'a>), + FilteredRequiredDictionary(FilteredRequiredDictionary<'a>), + FilteredOptionalDictionary(FilteredOptionalPageValidity<'a>, ValuesDictionary<'a>), +} + +impl<'a> utils::PageState<'a> for State<'a> { + fn len(&self) -> usize { + match self { + State::Optional(validity, _) => validity.len(), + State::Required(state) => state.len(), + State::Delta(state) => state.len(), + State::OptionalDelta(state, _) => state.len(), + State::RequiredDictionary(values) => values.len(), + State::OptionalDictionary(optional, _) => optional.len(), + State::FilteredRequired(state) => state.len(), + State::FilteredOptional(validity, _) => validity.len(), + 
State::FilteredDelta(state) => state.len(), + State::FilteredOptionalDelta(state, _) => state.len(), + State::FilteredRequiredDictionary(values) => values.len(), + State::FilteredOptionalDictionary(optional, _) => optional.len(), + } + } +} + +impl DecodedState for (Binary, MutableBitmap) { + fn len(&self) -> usize { + self.0.len() + } +} + +#[derive(Debug, Default)] +struct BinaryDecoder { + phantom_o: std::marker::PhantomData, +} + +impl<'a, O: Offset> utils::Decoder<'a> for BinaryDecoder { + type State = State<'a>; + type Dict = Dict; + type DecodedState = (Binary, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, dict: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, false) => Ok( + State::RequiredDictionary(RequiredDictionary::try_new(page, dict)?), + ), + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + Ok(State::OptionalDictionary( + OptionalPageValidity::try_new(page)?, + ValuesDictionary::try_new(page, dict)?, + )) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, true) => { + FilteredRequiredDictionary::try_new(page, dict) + .map(State::FilteredRequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, true) => { + Ok(State::FilteredOptionalDictionary( + FilteredOptionalPageValidity::try_new(page)?, + ValuesDictionary::try_new(page, dict)?, + )) + }, + (Encoding::Plain, _, true, false) => { + let (_, _, values) = split_buffer(page)?; + + let values = BinaryIter::new(values); + + Ok(State::Optional( + OptionalPageValidity::try_new(page)?, + values, + )) + }, + (Encoding::Plain, _, false, false) => Ok(State::Required(Required::try_new(page)?)), + (Encoding::Plain, _, false, true) => { + Ok(State::FilteredRequired(FilteredRequired::new(page))) + }, + (Encoding::Plain, _, true, true) => { + let (_, _, values) = split_buffer(page)?; + + Ok(State::FilteredOptional( + FilteredOptionalPageValidity::try_new(page)?, + BinaryIter::new(values), + )) + }, + (Encoding::DeltaLengthByteArray, _, false, false) => { + Delta::try_new(page).map(State::Delta) + }, + (Encoding::DeltaLengthByteArray, _, true, false) => Ok(State::OptionalDelta( + OptionalPageValidity::try_new(page)?, + Delta::try_new(page)?, + )), + (Encoding::DeltaLengthByteArray, _, false, true) => { + FilteredDelta::try_new(page).map(State::FilteredDelta) + }, + (Encoding::DeltaLengthByteArray, _, true, true) => Ok(State::FilteredOptionalDelta( + FilteredOptionalPageValidity::try_new(page)?, + Delta::try_new(page)?, + )), + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Binary::::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + additional: usize, + ) { + let (values, validity) = decoded; + match state { + State::Optional(page_validity, page_values) => extend_from_decoder( + validity, + page_validity, + Some(additional), + values, + page_values, + ), + State::Required(page) => { + for x in page.values.by_ref().take(additional) { + values.push(x) + } + }, + State::Delta(page) => { + values.extend_lengths(page.lengths.by_ref().take(additional), &mut 
page.values); + }, + State::OptionalDelta(page_validity, page_values) => { + let Binary { + offsets, + values: values_, + } = values; + + let last_offset = *offsets.last(); + extend_from_decoder( + validity, + page_validity, + Some(additional), + offsets, + page_values.lengths.by_ref(), + ); + + let length = *offsets.last() - last_offset; + + let (consumed, remaining) = page_values.values.split_at(length.to_usize()); + page_values.values = remaining; + values_.extend_from_slice(consumed); + }, + State::FilteredRequired(page) => { + for x in page.values.by_ref().take(additional) { + values.push(x) + } + }, + State::FilteredDelta(page) => { + for x in page.values.by_ref().take(additional) { + values.push(x) + } + }, + State::OptionalDictionary(page_validity, page_values) => { + let page_dict = &page_values.dict; + utils::extend_from_decoder( + validity, + page_validity, + Some(additional), + values, + &mut page_values + .values + .by_ref() + .map(|index| page_dict[index.unwrap() as usize].as_ref()), + ) + }, + State::RequiredDictionary(page) => { + let page_dict = &page.dict; + + for x in page + .values + .by_ref() + .map(|index| page_dict[index.unwrap() as usize].as_ref()) + .take(additional) + { + values.push(x) + } + }, + State::FilteredOptional(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(additional), + values, + page_values.by_ref(), + ); + }, + State::FilteredOptionalDelta(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(additional), + values, + page_values.by_ref(), + ); + }, + State::FilteredRequiredDictionary(page) => { + let page_dict = &page.dict; + for x in page + .values + .by_ref() + .map(|index| page_dict[index.unwrap() as usize].as_ref()) + .take(additional) + { + values.push(x) + } + }, + State::FilteredOptionalDictionary(page_validity, page_values) => { + let page_dict = &page_values.dict; + utils::extend_from_decoder( + validity, + page_validity, + Some(additional), + values, + &mut page_values + .values + .by_ref() + .map(|index| page_dict[index.unwrap() as usize].as_ref()), + ) + }, + } + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dict { + deserialize_plain(&page.buffer, page.num_values) + } +} + +pub(super) fn finish( + data_type: &DataType, + mut values: Binary, + mut validity: MutableBitmap, +) -> Result> { + values.offsets.shrink_to_fit(); + values.values.shrink_to_fit(); + validity.shrink_to_fit(); + + match data_type.to_physical_type() { + PhysicalType::Binary | PhysicalType::LargeBinary => BinaryArray::::try_new( + data_type.clone(), + values.offsets.into(), + values.values.into(), + validity.into(), + ) + .map(|x| x.boxed()), + PhysicalType::Utf8 | PhysicalType::LargeUtf8 => Utf8Array::::try_new( + data_type.clone(), + values.offsets.into(), + values.values.into(), + validity.into(), + ) + .map(|x| x.boxed()), + _ => unreachable!(), + } +} + +pub struct Iter { + iter: I, + data_type: DataType, + items: VecDeque<(Binary, MutableBitmap)>, + dict: Option, + chunk_size: Option, + remaining: usize, +} + +impl Iter { + pub fn new(iter: I, data_type: DataType, chunk_size: Option, num_rows: usize) -> Self { + Self { + iter, + data_type, + items: VecDeque::new(), + dict: None, + chunk_size, + remaining: num_rows, + } + } +} + +impl Iterator for Iter { + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + self.chunk_size, + 
&BinaryDecoder::::default(), + ); + match maybe_state { + MaybeNext::Some(Ok((values, validity))) => { + Some(finish(&self.data_type, values, validity)) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} + +pub(super) fn deserialize_plain(values: &[u8], num_values: usize) -> Dict { + SizedBinaryIter::new(values, num_values) + .map(|x| x.to_vec()) + .collect() +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/binary/dictionary.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/dictionary.rs new file mode 100644 index 000000000000..0fb3615de050 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/dictionary.rs @@ -0,0 +1,174 @@ +use std::collections::VecDeque; + +use parquet2::page::DictPage; + +use super::super::dictionary::*; +use super::super::utils::MaybeNext; +use super::super::Pages; +use super::utils::{Binary, SizedBinaryIter}; +use crate::array::{Array, BinaryArray, DictionaryArray, DictionaryKey, Utf8Array}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Result; +use crate::io::parquet::read::deserialize::nested_utils::{InitNested, NestedState}; +use crate::offset::Offset; + +/// An iterator adapter over [`Pages`] assumed to be encoded as parquet's dictionary-encoded binary representation +#[derive(Debug)] +pub struct DictIter +where + I: Pages, + O: Offset, + K: DictionaryKey, +{ + iter: I, + data_type: DataType, + values: Option>, + items: VecDeque<(Vec, MutableBitmap)>, + remaining: usize, + chunk_size: Option, + phantom: std::marker::PhantomData, +} + +impl DictIter +where + K: DictionaryKey, + O: Offset, + I: Pages, +{ + pub fn new(iter: I, data_type: DataType, num_rows: usize, chunk_size: Option) -> Self { + Self { + iter, + data_type, + values: None, + items: VecDeque::new(), + remaining: num_rows, + chunk_size, + phantom: std::marker::PhantomData, + } + } +} + +fn read_dict(data_type: DataType, dict: &DictPage) -> Box { + let data_type = match data_type { + DataType::Dictionary(_, values, _) => *values, + _ => data_type, + }; + + let values = SizedBinaryIter::new(&dict.buffer, dict.num_values); + + let mut data = Binary::::with_capacity(dict.num_values); + data.values = Vec::with_capacity(dict.buffer.len() - 4 * dict.num_values); + for item in values { + data.push(item) + } + + match data_type.to_physical_type() { + PhysicalType::Utf8 | PhysicalType::LargeUtf8 => { + Utf8Array::::new(data_type, data.offsets.into(), data.values.into(), None).boxed() + }, + PhysicalType::Binary | PhysicalType::LargeBinary => { + BinaryArray::::new(data_type, data.offsets.into(), data.values.into(), None).boxed() + }, + _ => unreachable!(), + } +} + +impl Iterator for DictIter +where + I: Pages, + O: Offset, + K: DictionaryKey, +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = next_dict( + &mut self.iter, + &mut self.items, + &mut self.values, + self.data_type.clone(), + &mut self.remaining, + self.chunk_size, + |dict| read_dict::(self.data_type.clone(), dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} + +/// An iterator adapter that converts [`DataPages`] into an [`Iterator`] of [`DictionaryArray`] +#[derive(Debug)] +pub struct NestedDictIter +where + I: Pages, + O: Offset, + K: DictionaryKey, +{ + iter: I, + init: Vec, + data_type: DataType, + 
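    /// The dictionary values, decoded once from the dictionary page and reused
    /// for every chunk this iterator yields.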
values: Option>, + items: VecDeque<(NestedState, (Vec, MutableBitmap))>, + remaining: usize, + chunk_size: Option, + phantom: std::marker::PhantomData, +} + +impl NestedDictIter +where + I: Pages, + O: Offset, + K: DictionaryKey, +{ + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + ) -> Self { + Self { + iter, + init, + data_type, + values: None, + items: VecDeque::new(), + remaining: num_rows, + chunk_size, + phantom: Default::default(), + } + } +} + +impl Iterator for NestedDictIter +where + I: Pages, + O: Offset, + K: DictionaryKey, +{ + type Item = Result<(NestedState, DictionaryArray)>; + + fn next(&mut self) -> Option { + let maybe_state = nested_next_dict( + &mut self.iter, + &mut self.items, + &mut self.remaining, + &self.init, + &mut self.values, + self.data_type.clone(), + self.chunk_size, + |dict| read_dict::(self.data_type.clone(), dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/binary/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/mod.rs new file mode 100644 index 000000000000..c48bfe276bcc --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/mod.rs @@ -0,0 +1,8 @@ +mod basic; +mod dictionary; +mod nested; +mod utils; + +pub use basic::Iter; +pub use dictionary::{DictIter, NestedDictIter}; +pub use nested::NestedIter; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/binary/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/nested.rs new file mode 100644 index 000000000000..64f076932e49 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/nested.rs @@ -0,0 +1,187 @@ +use std::collections::VecDeque; + +use parquet2::encoding::Encoding; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::nested_utils::*; +use super::super::utils; +use super::super::utils::MaybeNext; +use super::basic::{deserialize_plain, finish, Dict, ValuesDictionary}; +use super::utils::*; +use crate::array::Array; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::io::parquet::read::Pages; +use crate::offset::Offset; + +#[derive(Debug)] +enum State<'a> { + Optional(BinaryIter<'a>), + Required(BinaryIter<'a>), + RequiredDictionary(ValuesDictionary<'a>), + OptionalDictionary(ValuesDictionary<'a>), +} + +impl<'a> utils::PageState<'a> for State<'a> { + fn len(&self) -> usize { + match self { + State::Optional(validity) => validity.size_hint().0, + State::Required(state) => state.size_hint().0, + State::RequiredDictionary(required) => required.len(), + State::OptionalDictionary(optional) => optional.len(), + } + } +} + +#[derive(Debug, Default)] +struct BinaryDecoder { + phantom_o: std::marker::PhantomData, +} + +impl<'a, O: Offset> NestedDecoder<'a> for BinaryDecoder { + type State = State<'a>; + type Dictionary = Dict; + type DecodedState = (Binary, MutableBitmap); + + fn build_state( + &self, + page: &'a DataPage, + dict: Option<&'a Self::Dictionary>, + ) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::PlainDictionary | Encoding::RleDictionary, 
Some(dict), false, false) => { + ValuesDictionary::try_new(page, dict).map(State::RequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + ValuesDictionary::try_new(page, dict).map(State::OptionalDictionary) + }, + (Encoding::Plain, _, true, false) => { + let (_, _, values) = split_buffer(page)?; + + let values = BinaryIter::new(values); + + Ok(State::Optional(values)) + }, + (Encoding::Plain, _, false, false) => { + let (_, _, values) = split_buffer(page)?; + + let values = BinaryIter::new(values); + + Ok(State::Required(values)) + }, + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Binary::::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()> { + let (values, validity) = decoded; + match state { + State::Optional(page) => { + let value = page.next().unwrap_or_default(); + values.push(value); + validity.push(true); + }, + State::Required(page) => { + let value = page.next().unwrap_or_default(); + values.push(value); + }, + State::RequiredDictionary(page) => { + let dict_values = &page.dict; + let item = page + .values + .next() + .map(|index| dict_values[index.unwrap() as usize].as_ref()) + .unwrap_or_default(); + values.push(item); + }, + State::OptionalDictionary(page) => { + let dict_values = &page.dict; + let item = page + .values + .next() + .map(|index| dict_values[index.unwrap() as usize].as_ref()) + .unwrap_or_default(); + values.push(item); + validity.push(true); + }, + } + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let (values, validity) = decoded; + values.push(&[]); + validity.push(false); + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dictionary { + deserialize_plain(&page.buffer, page.num_values) + } +} + +pub struct NestedIter { + iter: I, + data_type: DataType, + init: Vec, + items: VecDeque<(NestedState, (Binary, MutableBitmap))>, + dict: Option, + chunk_size: Option, + remaining: usize, +} + +impl NestedIter { + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + ) -> Self { + Self { + iter, + data_type, + init, + items: VecDeque::new(), + dict: None, + chunk_size, + remaining: num_rows, + } + } +} + +impl Iterator for NestedIter { + type Item = Result<(NestedState, Box)>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + &self.init, + self.chunk_size, + &BinaryDecoder::::default(), + ); + match maybe_state { + MaybeNext::Some(Ok((nested, decoded))) => { + Some(finish(&self.data_type, decoded.0, decoded.1).map(|array| (nested, array))) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/binary/utils.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/utils.rs new file mode 100644 index 000000000000..0a2a0f3466f8 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/binary/utils.rs @@ -0,0 +1,169 @@ +use super::super::utils::Pushable; +use crate::offset::{Offset, Offsets}; + +/// [`Pushable`] for variable length binary data. 
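/// Value `i` occupies `values[offsets[i]..offsets[i + 1]]`, matching Arrow's
/// variable-size binary layout.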
+#[derive(Debug)] +pub struct Binary { + pub offsets: Offsets, + pub values: Vec, +} + +impl Pushable for Offsets { + fn reserve(&mut self, additional: usize) { + self.reserve(additional) + } + #[inline] + fn len(&self) -> usize { + self.len_proxy() + } + + #[inline] + fn push(&mut self, value: usize) { + self.try_push_usize(value).unwrap() + } + + #[inline] + fn push_null(&mut self) { + self.extend_constant(1); + } + + #[inline] + fn extend_constant(&mut self, additional: usize, _: usize) { + self.extend_constant(additional) + } +} + +impl Binary { + #[inline] + pub fn with_capacity(capacity: usize) -> Self { + Self { + offsets: Offsets::with_capacity(capacity), + values: Vec::with_capacity(capacity.min(100) * 24), + } + } + + #[inline] + pub fn push(&mut self, v: &[u8]) { + if self.offsets.len_proxy() == 100 && self.offsets.capacity() > 100 { + let bytes_per_row = self.values.len() / 100 + 1; + let bytes_estimate = bytes_per_row * self.offsets.capacity(); + if bytes_estimate > self.values.capacity() { + self.values.reserve(bytes_estimate - self.values.capacity()); + } + } + + self.values.extend(v); + self.offsets.try_push_usize(v.len()).unwrap() + } + + #[inline] + pub fn extend_constant(&mut self, additional: usize) { + self.offsets.extend_constant(additional); + } + + #[inline] + pub fn len(&self) -> usize { + self.offsets.len_proxy() + } + + #[inline] + pub fn extend_lengths>(&mut self, lengths: I, values: &mut &[u8]) { + let current_offset = *self.offsets.last(); + self.offsets.try_extend_from_lengths(lengths).unwrap(); + let new_offset = *self.offsets.last(); + let length = new_offset.to_usize() - current_offset.to_usize(); + let (consumed, remaining) = values.split_at(length); + *values = remaining; + self.values.extend_from_slice(consumed); + } +} + +impl<'a, O: Offset> Pushable<&'a [u8]> for Binary { + #[inline] + fn reserve(&mut self, additional: usize) { + let avg_len = self.values.len() / std::cmp::max(self.offsets.last().to_usize(), 1); + self.values.reserve(additional * avg_len); + self.offsets.reserve(additional); + } + #[inline] + fn len(&self) -> usize { + self.len() + } + + #[inline] + fn push_null(&mut self) { + self.push(&[]) + } + + #[inline] + fn push(&mut self, value: &[u8]) { + self.push(value) + } + + #[inline] + fn extend_constant(&mut self, additional: usize, value: &[u8]) { + assert_eq!(value.len(), 0); + self.extend_constant(additional) + } +} + +#[derive(Debug)] +pub struct BinaryIter<'a> { + values: &'a [u8], +} + +impl<'a> BinaryIter<'a> { + pub fn new(values: &'a [u8]) -> Self { + Self { values } + } +} + +impl<'a> Iterator for BinaryIter<'a> { + type Item = &'a [u8]; + + #[inline] + fn next(&mut self) -> Option { + if self.values.is_empty() { + return None; + } + let (length, remaining) = self.values.split_at(4); + let length = u32::from_le_bytes(length.try_into().unwrap()) as usize; + let (result, remaining) = remaining.split_at(length); + self.values = remaining; + Some(result) + } +} + +#[derive(Debug)] +pub struct SizedBinaryIter<'a> { + iter: BinaryIter<'a>, + remaining: usize, +} + +impl<'a> SizedBinaryIter<'a> { + pub fn new(values: &'a [u8], size: usize) -> Self { + let iter = BinaryIter::new(values); + Self { + iter, + remaining: size, + } + } +} + +impl<'a> Iterator for SizedBinaryIter<'a> { + type Item = &'a [u8]; + + #[inline] + fn next(&mut self) -> Option { + if self.remaining == 0 { + return None; + } else { + self.remaining -= 1 + }; + self.iter.next() + } + + fn size_hint(&self) -> (usize, Option) { + (self.remaining, 
Some(self.remaining)) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/basic.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/basic.rs new file mode 100644 index 000000000000..dd3ac9eb52c5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/basic.rs @@ -0,0 +1,229 @@ +use std::collections::VecDeque; + +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::Encoding; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::utils::{ + extend_from_decoder, get_selected_rows, next, DecodedState, Decoder, + FilteredOptionalPageValidity, MaybeNext, OptionalPageValidity, +}; +use super::super::{utils, Pages}; +use crate::array::BooleanArray; +use crate::bitmap::utils::BitmapIter; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; + +#[derive(Debug)] +struct Values<'a>(BitmapIter<'a>); + +impl<'a> Values<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + + Ok(Self(BitmapIter::new(values, 0, values.len() * 8))) + } +} + +// The state of a required DataPage with a boolean physical type +#[derive(Debug)] +struct Required<'a> { + values: &'a [u8], + // invariant: offset <= length; + offset: usize, + length: usize, +} + +impl<'a> Required<'a> { + pub fn new(page: &'a DataPage) -> Self { + Self { + values: page.buffer(), + offset: 0, + length: page.num_values(), + } + } +} + +#[derive(Debug)] +struct FilteredRequired<'a> { + values: SliceFilteredIter>, +} + +impl<'a> FilteredRequired<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + // todo: replace this by an iterator over slices, for faster deserialization + let values = BitmapIter::new(values, 0, page.num_values()); + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(Self { values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +// The state of a `DataPage` of `Boolean` parquet boolean type +#[derive(Debug)] +enum State<'a> { + Optional(OptionalPageValidity<'a>, Values<'a>), + Required(Required<'a>), + FilteredRequired(FilteredRequired<'a>), + FilteredOptional(FilteredOptionalPageValidity<'a>, Values<'a>), +} + +impl<'a> State<'a> { + pub fn len(&self) -> usize { + match self { + State::Optional(validity, _) => validity.len(), + State::Required(page) => page.length - page.offset, + State::FilteredRequired(page) => page.len(), + State::FilteredOptional(optional, _) => optional.len(), + } + } +} + +impl<'a> utils::PageState<'a> for State<'a> { + fn len(&self) -> usize { + self.len() + } +} + +impl DecodedState for (MutableBitmap, MutableBitmap) { + fn len(&self) -> usize { + self.0.len() + } +} + +#[derive(Default)] +struct BooleanDecoder {} + +impl<'a> Decoder<'a> for BooleanDecoder { + type State = State<'a>; + type Dict = (); + type DecodedState = (MutableBitmap, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, _: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), is_optional, is_filtered) { + (Encoding::Plain, true, false) => Ok(State::Optional( + OptionalPageValidity::try_new(page)?, + Values::try_new(page)?, + )), + (Encoding::Plain, false, false) => Ok(State::Required(Required::new(page))), + 
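            // the `filtered` variants only decode the row intervals selected on the page
            // (`page.selected_rows()`), skipping everything else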
(Encoding::Plain, true, true) => Ok(State::FilteredOptional( + FilteredOptionalPageValidity::try_new(page)?, + Values::try_new(page)?, + )), + (Encoding::Plain, false, true) => { + Ok(State::FilteredRequired(FilteredRequired::try_new(page)?)) + }, + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + MutableBitmap::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + remaining: usize, + ) { + let (values, validity) = decoded; + match state { + State::Optional(page_validity, page_values) => extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + &mut page_values.0, + ), + State::Required(page) => { + let remaining = remaining.min(page.length - page.offset); + values.extend_from_slice(page.values, page.offset, remaining); + page.offset += remaining; + }, + State::FilteredRequired(page) => { + values.reserve(remaining); + for item in page.values.by_ref().take(remaining) { + values.push(item) + } + }, + State::FilteredOptional(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values.0.by_ref(), + ); + }, + } + } + + fn deserialize_dict(&self, _: &DictPage) -> Self::Dict {} +} + +fn finish(data_type: &DataType, values: MutableBitmap, validity: MutableBitmap) -> BooleanArray { + BooleanArray::new(data_type.clone(), values.into(), validity.into()) +} + +/// An iterator adapter over [`Pages`] assumed to be encoded as boolean arrays +#[derive(Debug)] +pub struct Iter { + iter: I, + data_type: DataType, + items: VecDeque<(MutableBitmap, MutableBitmap)>, + chunk_size: Option, + remaining: usize, +} + +impl Iter { + pub fn new(iter: I, data_type: DataType, chunk_size: Option, num_rows: usize) -> Self { + Self { + iter, + data_type, + items: VecDeque::new(), + chunk_size, + remaining: num_rows, + } + } +} + +impl Iterator for Iter { + type Item = Result; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut None, + &mut self.remaining, + self.chunk_size, + &BooleanDecoder::default(), + ); + match maybe_state { + MaybeNext::Some(Ok((values, validity))) => { + Some(Ok(finish(&self.data_type, values, validity))) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/mod.rs new file mode 100644 index 000000000000..dc00cc2a4249 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/mod.rs @@ -0,0 +1,6 @@ +mod basic; +mod nested; + +pub use nested::NestedIter; + +pub use self::basic::Iter; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/nested.rs new file mode 100644 index 000000000000..f3e684ab9fe3 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/boolean/nested.rs @@ -0,0 +1,153 @@ +use std::collections::VecDeque; + +use parquet2::encoding::Encoding; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::nested_utils::*; +use super::super::utils::MaybeNext; +use super::super::{utils, Pages}; +use crate::array::BooleanArray; +use crate::bitmap::utils::BitmapIter; +use 
crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; + +// The state of a `DataPage` of `Boolean` parquet boolean type +#[allow(clippy::large_enum_variant)] +#[derive(Debug)] +enum State<'a> { + Optional(BitmapIter<'a>), + Required(BitmapIter<'a>), +} + +impl<'a> State<'a> { + pub fn len(&self) -> usize { + match self { + State::Optional(iter) => iter.size_hint().0, + State::Required(iter) => iter.size_hint().0, + } + } +} + +impl<'a> utils::PageState<'a> for State<'a> { + fn len(&self) -> usize { + self.len() + } +} + +#[derive(Default)] +struct BooleanDecoder {} + +impl<'a> NestedDecoder<'a> for BooleanDecoder { + type State = State<'a>; + type Dictionary = (); + type DecodedState = (MutableBitmap, MutableBitmap); + + fn build_state( + &self, + page: &'a DataPage, + _: Option<&'a Self::Dictionary>, + ) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), is_optional, is_filtered) { + (Encoding::Plain, true, false) => { + let (_, _, values) = split_buffer(page)?; + let values = BitmapIter::new(values, 0, values.len() * 8); + + Ok(State::Optional(values)) + }, + (Encoding::Plain, false, false) => { + let (_, _, values) = split_buffer(page)?; + let values = BitmapIter::new(values, 0, values.len() * 8); + + Ok(State::Required(values)) + }, + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + MutableBitmap::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn push_valid(&self, state: &mut State, decoded: &mut Self::DecodedState) -> Result<()> { + let (values, validity) = decoded; + match state { + State::Optional(page_values) => { + let value = page_values.next().unwrap_or_default(); + values.push(value); + validity.push(true); + }, + State::Required(page_values) => { + let value = page_values.next().unwrap_or_default(); + values.push(value); + }, + } + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let (values, validity) = decoded; + values.push(false); + validity.push(false); + } + + fn deserialize_dict(&self, _: &DictPage) -> Self::Dictionary {} +} + +/// An iterator adapter over [`Pages`] assumed to be encoded as boolean arrays +#[derive(Debug)] +pub struct NestedIter { + iter: I, + init: Vec, + items: VecDeque<(NestedState, (MutableBitmap, MutableBitmap))>, + remaining: usize, + chunk_size: Option, +} + +impl NestedIter { + pub fn new(iter: I, init: Vec, num_rows: usize, chunk_size: Option) -> Self { + Self { + iter, + init, + items: VecDeque::new(), + remaining: num_rows, + chunk_size, + } + } +} + +fn finish(data_type: &DataType, values: MutableBitmap, validity: MutableBitmap) -> BooleanArray { + BooleanArray::new(data_type.clone(), values.into(), validity.into()) +} + +impl Iterator for NestedIter { + type Item = Result<(NestedState, BooleanArray)>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut None, + &mut self.remaining, + &self.init, + self.chunk_size, + &BooleanDecoder::default(), + ); + match maybe_state { + MaybeNext::Some(Ok((nested, (values, validity)))) => { + Some(Ok((nested, finish(&DataType::Boolean, values, validity)))) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/mod.rs 
b/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/mod.rs new file mode 100644 index 000000000000..7826f5856c0e --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/mod.rs @@ -0,0 +1,314 @@ +mod nested; + +use std::collections::VecDeque; + +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::hybrid_rle::HybridRleDecoder; +use parquet2::encoding::Encoding; +use parquet2::page::{DataPage, DictPage, Page}; +use parquet2::schema::Repetition; + +use super::utils::{ + self, dict_indices_decoder, extend_from_decoder, get_selected_rows, DecodedState, Decoder, + FilteredOptionalPageValidity, MaybeNext, OptionalPageValidity, +}; +use super::Pages; +use crate::array::{Array, DictionaryArray, DictionaryKey, PrimitiveArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +// The state of a `DataPage` of `Primitive` parquet primitive type +#[derive(Debug)] +pub enum State<'a> { + Optional(Optional<'a>), + Required(Required<'a>), + FilteredRequired(FilteredRequired<'a>), + FilteredOptional(FilteredOptionalPageValidity<'a>, HybridRleDecoder<'a>), +} + +#[derive(Debug)] +pub struct Required<'a> { + values: HybridRleDecoder<'a>, +} + +impl<'a> Required<'a> { + fn try_new(page: &'a DataPage) -> Result { + let values = dict_indices_decoder(page)?; + Ok(Self { values }) + } +} + +#[derive(Debug)] +pub struct FilteredRequired<'a> { + values: SliceFilteredIter>, +} + +impl<'a> FilteredRequired<'a> { + fn try_new(page: &'a DataPage) -> Result { + let values = dict_indices_decoder(page)?; + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(Self { values }) + } +} + +#[derive(Debug)] +pub struct Optional<'a> { + values: HybridRleDecoder<'a>, + validity: OptionalPageValidity<'a>, +} + +impl<'a> Optional<'a> { + fn try_new(page: &'a DataPage) -> Result { + let values = dict_indices_decoder(page)?; + + Ok(Self { + values, + validity: OptionalPageValidity::try_new(page)?, + }) + } +} + +impl<'a> utils::PageState<'a> for State<'a> { + fn len(&self) -> usize { + match self { + State::Optional(optional) => optional.validity.len(), + State::Required(required) => required.values.size_hint().0, + State::FilteredRequired(required) => required.values.size_hint().0, + State::FilteredOptional(validity, _) => validity.len(), + } + } +} + +#[derive(Debug)] +pub struct PrimitiveDecoder +where + K: DictionaryKey, +{ + phantom_k: std::marker::PhantomData, +} + +impl Default for PrimitiveDecoder +where + K: DictionaryKey, +{ + #[inline] + fn default() -> Self { + Self { + phantom_k: std::marker::PhantomData, + } + } +} + +impl<'a, K> utils::Decoder<'a> for PrimitiveDecoder +where + K: DictionaryKey, +{ + type State = State<'a>; + type Dict = (); + type DecodedState = (Vec, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, _: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), is_optional, is_filtered) { + (Encoding::PlainDictionary | Encoding::RleDictionary, false, false) => { + Required::try_new(page).map(State::Required) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, true, false) => { + Optional::try_new(page).map(State::Optional) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, false, true) => { + FilteredRequired::try_new(page).map(State::FilteredRequired) + }, + 
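+            // optional + filtered: the filtered validity iterator decides which
+            // positions are read, while the dictionary keys are decoded alongside it.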
(Encoding::PlainDictionary | Encoding::RleDictionary, true, true) => { + Ok(State::FilteredOptional( + FilteredOptionalPageValidity::try_new(page)?, + dict_indices_decoder(page)?, + )) + }, + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Vec::::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + remaining: usize, + ) { + let (values, validity) = decoded; + match state { + State::Optional(page) => extend_from_decoder( + validity, + &mut page.validity, + Some(remaining), + values, + &mut page.values.by_ref().map(|x| { + // todo: rm unwrap + let x: usize = x.unwrap().try_into().unwrap(); + match x.try_into() { + Ok(key) => key, + // todo: convert this to an error. + Err(_) => panic!("The maximum key is too small"), + } + }), + ), + State::Required(page) => { + values.extend( + page.values + .by_ref() + .map(|x| { + // todo: rm unwrap + let x: usize = x.unwrap().try_into().unwrap(); + let x: K = match x.try_into() { + Ok(key) => key, + // todo: convert this to an error. + Err(_) => { + panic!("The maximum key is too small") + }, + }; + x + }) + .take(remaining), + ); + }, + State::FilteredOptional(page_validity, page_values) => extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + &mut page_values.by_ref().map(|x| { + // todo: rm unwrap + let x: usize = x.unwrap().try_into().unwrap(); + let x: K = match x.try_into() { + Ok(key) => key, + // todo: convert this to an error. + Err(_) => { + panic!("The maximum key is too small") + }, + }; + x + }), + ), + State::FilteredRequired(page) => { + values.extend( + page.values + .by_ref() + .map(|x| { + // todo: rm unwrap + let x: usize = x.unwrap().try_into().unwrap(); + let x: K = match x.try_into() { + Ok(key) => key, + // todo: convert this to an error. 
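+                    // the dictionary index does not fit in the key type `K`
+                    // (e.g. a u8 key with a dictionary of more than 256 values).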
+ Err(_) => { + panic!("The maximum key is too small") + }, + }; + x + }) + .take(remaining), + ); + }, + } + } + + fn deserialize_dict(&self, _: &DictPage) -> Self::Dict {} +} + +fn finish_key(values: Vec, validity: MutableBitmap) -> PrimitiveArray { + PrimitiveArray::new(K::PRIMITIVE.into(), values.into(), validity.into()) +} + +#[inline] +pub(super) fn next_dict Box>( + iter: &mut I, + items: &mut VecDeque<(Vec, MutableBitmap)>, + dict: &mut Option>, + data_type: DataType, + remaining: &mut usize, + chunk_size: Option, + read_dict: F, +) -> MaybeNext>> { + if items.len() > 1 { + let (values, validity) = items.pop_front().unwrap(); + let keys = finish_key(values, validity); + return MaybeNext::Some(DictionaryArray::try_new( + data_type, + keys, + dict.clone().unwrap(), + )); + } + match iter.next() { + Err(e) => MaybeNext::Some(Err(e.into())), + Ok(Some(page)) => { + let (page, dict) = match (&dict, page) { + (None, Page::Data(_)) => { + return MaybeNext::Some(Err(Error::nyi( + "dictionary arrays from non-dict-encoded pages", + ))); + }, + (_, Page::Dict(dict_page)) => { + *dict = Some(read_dict(dict_page)); + return next_dict( + iter, items, dict, data_type, remaining, chunk_size, read_dict, + ); + }, + (Some(dict), Page::Data(page)) => (page, dict), + }; + + // there is a new page => consume the page from the start + let maybe_page = PrimitiveDecoder::::default().build_state(page, None); + let page = match maybe_page { + Ok(page) => page, + Err(e) => return MaybeNext::Some(Err(e)), + }; + + utils::extend_from_new_page( + page, + chunk_size, + items, + remaining, + &PrimitiveDecoder::::default(), + ); + + if items.front().unwrap().len() < chunk_size.unwrap_or(usize::MAX) { + MaybeNext::More + } else { + let (values, validity) = items.pop_front().unwrap(); + let keys = finish_key(values, validity); + MaybeNext::Some(DictionaryArray::try_new(data_type, keys, dict.clone())) + } + }, + Ok(None) => { + if let Some((values, validity)) = items.pop_front() { + // we have a populated item and no more pages + // the only case where an item's length may be smaller than chunk_size + debug_assert!(values.len() <= chunk_size.unwrap_or(usize::MAX)); + + let keys = finish_key(values, validity); + MaybeNext::Some(DictionaryArray::try_new( + data_type, + keys, + dict.clone().unwrap(), + )) + } else { + MaybeNext::None + } + }, + } +} + +pub use nested::next_dict as nested_next_dict; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/nested.rs new file mode 100644 index 000000000000..1fb1919d1504 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/dictionary/nested.rs @@ -0,0 +1,213 @@ +use std::collections::VecDeque; + +use parquet2::encoding::hybrid_rle::HybridRleDecoder; +use parquet2::encoding::Encoding; +use parquet2::page::{DataPage, DictPage, Page}; +use parquet2::schema::Repetition; + +use super::super::super::Pages; +use super::super::nested_utils::*; +use super::super::utils::{dict_indices_decoder, not_implemented, MaybeNext, PageState}; +use super::finish_key; +use crate::array::{Array, DictionaryArray, DictionaryKey}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; + +// The state of a required DataPage with a boolean physical type +#[derive(Debug)] +pub struct Required<'a> { + values: HybridRleDecoder<'a>, + length: usize, +} + +impl<'a> Required<'a> { + fn try_new(page: &'a DataPage) -> Result { + let values = 
dict_indices_decoder(page)?; + let length = page.num_values(); + Ok(Self { values, length }) + } +} + +// The state of a `DataPage` of a `Dictionary` type +#[allow(clippy::large_enum_variant)] +#[derive(Debug)] +pub enum State<'a> { + Optional(HybridRleDecoder<'a>), + Required(Required<'a>), +} + +impl<'a> State<'a> { + pub fn len(&self) -> usize { + match self { + State::Optional(page) => page.len(), + State::Required(page) => page.length, + } + } +} + +impl<'a> PageState<'a> for State<'a> { + fn len(&self) -> usize { + self.len() + } +} + +#[derive(Debug)] +pub struct DictionaryDecoder +where + K: DictionaryKey, +{ + phantom_k: std::marker::PhantomData, +} + +impl Default for DictionaryDecoder +where + K: DictionaryKey, +{ + #[inline] + fn default() -> Self { + Self { + phantom_k: std::marker::PhantomData, + } + } +} + +impl<'a, K: DictionaryKey> NestedDecoder<'a> for DictionaryDecoder { + type State = State<'a>; + type Dictionary = (); + type DecodedState = (Vec, MutableBitmap); + + fn build_state( + &self, + page: &'a DataPage, + _: Option<&'a Self::Dictionary>, + ) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), is_optional, is_filtered) { + (Encoding::RleDictionary | Encoding::PlainDictionary, true, false) => { + dict_indices_decoder(page).map(State::Optional) + }, + (Encoding::RleDictionary | Encoding::PlainDictionary, false, false) => { + Required::try_new(page).map(State::Required) + }, + _ => Err(not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Vec::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()> { + let (values, validity) = decoded; + match state { + State::Optional(page_values) => { + let key = page_values.next().transpose()?; + // todo: convert unwrap to error + let key = match K::try_from(key.unwrap_or_default() as usize) { + Ok(key) => key, + Err(_) => todo!(), + }; + values.push(key); + validity.push(true); + }, + State::Required(page_values) => { + let key = page_values.values.next().transpose()?; + let key = match K::try_from(key.unwrap_or_default() as usize) { + Ok(key) => key, + Err(_) => todo!(), + }; + values.push(key); + }, + } + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let (values, validity) = decoded; + values.push(K::default()); + validity.push(false) + } + + fn deserialize_dict(&self, _: &DictPage) -> Self::Dictionary {} +} + +#[allow(clippy::too_many_arguments)] +pub fn next_dict Box>( + iter: &mut I, + items: &mut VecDeque<(NestedState, (Vec, MutableBitmap))>, + remaining: &mut usize, + init: &[InitNested], + dict: &mut Option>, + data_type: DataType, + chunk_size: Option, + read_dict: F, +) -> MaybeNext)>> { + if items.len() > 1 { + let (nested, (values, validity)) = items.pop_front().unwrap(); + let keys = finish_key(values, validity); + let dict = DictionaryArray::try_new(data_type, keys, dict.clone().unwrap()); + return MaybeNext::Some(dict.map(|dict| (nested, dict))); + } + match iter.next() { + Err(e) => MaybeNext::Some(Err(e.into())), + Ok(Some(page)) => { + let (page, dict) = match (&dict, page) { + (None, Page::Data(_)) => { + return MaybeNext::Some(Err(Error::nyi( + "dictionary arrays from non-dict-encoded pages", + ))); + }, + (_, Page::Dict(dict_page)) => { + *dict = Some(read_dict(dict_page)); + 
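+                    // the dictionary page is now materialized; recurse so that the
+                    // following data pages are decoded against it.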
return next_dict( + iter, items, remaining, init, dict, data_type, chunk_size, read_dict, + ); + }, + (Some(dict), Page::Data(page)) => (page, dict), + }; + + let error = extend( + page, + init, + items, + None, + remaining, + &DictionaryDecoder::::default(), + chunk_size, + ); + match error { + Ok(_) => {}, + Err(e) => return MaybeNext::Some(Err(e)), + }; + + if items.front().unwrap().0.len() < chunk_size.unwrap_or(usize::MAX) { + MaybeNext::More + } else { + let (nested, (values, validity)) = items.pop_front().unwrap(); + let keys = finish_key(values, validity); + let dict = DictionaryArray::try_new(data_type, keys, dict.clone()); + MaybeNext::Some(dict.map(|dict| (nested, dict))) + } + }, + Ok(None) => { + if let Some((nested, (values, validity))) = items.pop_front() { + // we have a populated item and no more pages + // the only case where an item's length may be smaller than chunk_size + debug_assert!(values.len() <= chunk_size.unwrap_or(usize::MAX)); + + let keys = finish_key(values, validity); + let dict = DictionaryArray::try_new(data_type, keys, dict.clone().unwrap()); + MaybeNext::Some(dict.map(|dict| (nested, dict))) + } else { + MaybeNext::None + } + }, + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/basic.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/basic.rs new file mode 100644 index 000000000000..aee3116ed64e --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/basic.rs @@ -0,0 +1,322 @@ +use std::collections::VecDeque; + +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::{hybrid_rle, Encoding}; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::utils::{ + dict_indices_decoder, extend_from_decoder, get_selected_rows, next, not_implemented, + DecodedState, Decoder, FilteredOptionalPageValidity, MaybeNext, OptionalPageValidity, + PageState, Pushable, +}; +use super::super::Pages; +use super::utils::FixedSizeBinary; +use crate::array::FixedSizeBinaryArray; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; + +pub(super) type Dict = Vec; + +#[derive(Debug)] +pub(super) struct Optional<'a> { + pub(super) values: std::slice::ChunksExact<'a, u8>, + pub(super) validity: OptionalPageValidity<'a>, +} + +impl<'a> Optional<'a> { + pub(super) fn try_new(page: &'a DataPage, size: usize) -> Result { + let (_, _, values) = split_buffer(page)?; + + let values = values.chunks_exact(size); + + Ok(Self { + values, + validity: OptionalPageValidity::try_new(page)?, + }) + } +} + +#[derive(Debug)] +pub(super) struct Required<'a> { + pub values: std::slice::ChunksExact<'a, u8>, +} + +impl<'a> Required<'a> { + pub(super) fn new(page: &'a DataPage, size: usize) -> Self { + let values = page.buffer(); + assert_eq!(values.len() % size, 0); + let values = values.chunks_exact(size); + Self { values } + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct FilteredRequired<'a> { + pub values: SliceFilteredIter>, +} + +impl<'a> FilteredRequired<'a> { + fn new(page: &'a DataPage, size: usize) -> Self { + let values = page.buffer(); + assert_eq!(values.len() % size, 0); + let values = values.chunks_exact(size); + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Self { values } + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + 
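+// A minimal, illustrative sketch (not used by this module) of what the
+// dictionary-encoded states below do: each decoded index selects one
+// `size`-byte slice out of the flat dictionary buffer. The function name and
+// the inputs `dict` and `indices` are hypothetical.
+#[allow(dead_code)]
+fn materialize_fixed_size_dict(dict: &[u8], size: usize, indices: &[u32]) -> Vec<u8> {
+    let mut out = Vec::with_capacity(indices.len() * size);
+    for &index in indices {
+        let index = index as usize;
+        // the `index`-th fixed-size value of the dictionary page
+        out.extend_from_slice(&dict[index * size..(index + 1) * size]);
+    }
+    out
+}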
+#[derive(Debug)] +pub(super) struct RequiredDictionary<'a> { + pub values: hybrid_rle::HybridRleDecoder<'a>, + pub dict: &'a Dict, +} + +impl<'a> RequiredDictionary<'a> { + pub(super) fn try_new(page: &'a DataPage, dict: &'a Dict) -> Result { + let values = dict_indices_decoder(page)?; + + Ok(Self { dict, values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct OptionalDictionary<'a> { + pub(super) values: hybrid_rle::HybridRleDecoder<'a>, + pub(super) validity: OptionalPageValidity<'a>, + pub(super) dict: &'a Dict, +} + +impl<'a> OptionalDictionary<'a> { + pub(super) fn try_new(page: &'a DataPage, dict: &'a Dict) -> Result { + let values = dict_indices_decoder(page)?; + + Ok(Self { + values, + validity: OptionalPageValidity::try_new(page)?, + dict, + }) + } +} + +#[derive(Debug)] +enum State<'a> { + Optional(Optional<'a>), + Required(Required<'a>), + RequiredDictionary(RequiredDictionary<'a>), + OptionalDictionary(OptionalDictionary<'a>), + FilteredRequired(FilteredRequired<'a>), + FilteredOptional( + FilteredOptionalPageValidity<'a>, + std::slice::ChunksExact<'a, u8>, + ), +} + +impl<'a> PageState<'a> for State<'a> { + fn len(&self) -> usize { + match self { + State::Optional(state) => state.validity.len(), + State::Required(state) => state.len(), + State::RequiredDictionary(state) => state.len(), + State::OptionalDictionary(state) => state.validity.len(), + State::FilteredRequired(state) => state.len(), + State::FilteredOptional(state, _) => state.len(), + } + } +} + +struct BinaryDecoder { + size: usize, +} + +impl DecodedState for (FixedSizeBinary, MutableBitmap) { + fn len(&self) -> usize { + self.0.len() + } +} + +impl<'a> Decoder<'a> for BinaryDecoder { + type State = State<'a>; + type Dict = Dict; + type DecodedState = (FixedSizeBinary, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, dict: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::Plain, _, true, false) => { + Ok(State::Optional(Optional::try_new(page, self.size)?)) + }, + (Encoding::Plain, _, false, false) => { + Ok(State::Required(Required::new(page, self.size))) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, false) => { + RequiredDictionary::try_new(page, dict).map(State::RequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + OptionalDictionary::try_new(page, dict).map(State::OptionalDictionary) + }, + (Encoding::Plain, None, false, true) => Ok(State::FilteredRequired( + FilteredRequired::new(page, self.size), + )), + (Encoding::Plain, _, true, true) => { + let (_, _, values) = split_buffer(page)?; + + Ok(State::FilteredOptional( + FilteredOptionalPageValidity::try_new(page)?, + values.chunks_exact(self.size), + )) + }, + _ => Err(not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + FixedSizeBinary::with_capacity(capacity, self.size), + MutableBitmap::with_capacity(capacity), + ) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + + remaining: usize, + ) { + let (values, validity) = decoded; + match state { + State::Optional(page) => extend_from_decoder( + validity, + &mut page.validity, + Some(remaining), + values, + &mut 
page.values, + ), + State::Required(page) => { + for x in page.values.by_ref().take(remaining) { + values.push(x) + } + }, + State::FilteredRequired(page) => { + for x in page.values.by_ref().take(remaining) { + values.push(x) + } + }, + State::OptionalDictionary(page) => extend_from_decoder( + validity, + &mut page.validity, + Some(remaining), + values, + page.values.by_ref().map(|index| { + let index = index.unwrap() as usize; + &page.dict[index * self.size..(index + 1) * self.size] + }), + ), + State::RequiredDictionary(page) => { + for x in page + .values + .by_ref() + .map(|index| { + let index = index.unwrap() as usize; + &page.dict[index * self.size..(index + 1) * self.size] + }) + .take(remaining) + { + values.push(x) + } + }, + State::FilteredOptional(page_validity, page_values) => { + extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values.by_ref(), + ); + }, + } + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dict { + page.buffer.clone() + } +} + +pub fn finish( + data_type: &DataType, + values: FixedSizeBinary, + validity: MutableBitmap, +) -> FixedSizeBinaryArray { + FixedSizeBinaryArray::new(data_type.clone(), values.values.into(), validity.into()) +} + +pub struct Iter { + iter: I, + data_type: DataType, + size: usize, + items: VecDeque<(FixedSizeBinary, MutableBitmap)>, + dict: Option, + chunk_size: Option, + remaining: usize, +} + +impl Iter { + pub fn new(iter: I, data_type: DataType, num_rows: usize, chunk_size: Option) -> Self { + let size = FixedSizeBinaryArray::get_size(&data_type); + Self { + iter, + data_type, + size, + items: VecDeque::new(), + dict: None, + chunk_size, + remaining: num_rows, + } + } +} + +impl Iterator for Iter { + type Item = Result; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + self.chunk_size, + &BinaryDecoder { size: self.size }, + ); + match maybe_state { + MaybeNext::Some(Ok((values, validity))) => { + Some(Ok(finish(&self.data_type, values, validity))) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/dictionary.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/dictionary.rs new file mode 100644 index 000000000000..3f5455b0bdb8 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/dictionary.rs @@ -0,0 +1,150 @@ +use std::collections::VecDeque; + +use parquet2::page::DictPage; + +use super::super::dictionary::*; +use super::super::utils::MaybeNext; +use super::super::Pages; +use crate::array::{Array, DictionaryArray, DictionaryKey, FixedSizeBinaryArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::io::parquet::read::deserialize::nested_utils::{InitNested, NestedState}; + +/// An iterator adapter over [`Pages`] assumed to be encoded as parquet's dictionary-encoded binary representation +#[derive(Debug)] +pub struct DictIter +where + I: Pages, + K: DictionaryKey, +{ + iter: I, + data_type: DataType, + values: Option>, + items: VecDeque<(Vec, MutableBitmap)>, + remaining: usize, + chunk_size: Option, +} + +impl DictIter +where + K: DictionaryKey, + I: Pages, +{ + pub fn new(iter: I, data_type: DataType, num_rows: usize, chunk_size: Option) -> Self { + Self { + iter, + data_type, + values: None, + items: VecDeque::new(), + remaining: 
num_rows, + chunk_size, + } + } +} + +fn read_dict(data_type: DataType, dict: &DictPage) -> Box { + let data_type = match data_type { + DataType::Dictionary(_, values, _) => *values, + _ => data_type, + }; + + let values = dict.buffer.clone(); + + FixedSizeBinaryArray::try_new(data_type, values.into(), None) + .unwrap() + .boxed() +} + +impl Iterator for DictIter +where + I: Pages, + K: DictionaryKey, +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = next_dict( + &mut self.iter, + &mut self.items, + &mut self.values, + self.data_type.clone(), + &mut self.remaining, + self.chunk_size, + |dict| read_dict(self.data_type.clone(), dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} + +/// An iterator adapter that converts [`DataPages`] into an [`Iterator`] of [`DictionaryArray`]. +#[derive(Debug)] +pub struct NestedDictIter +where + I: Pages, + K: DictionaryKey, +{ + iter: I, + init: Vec, + data_type: DataType, + values: Option>, + items: VecDeque<(NestedState, (Vec, MutableBitmap))>, + remaining: usize, + chunk_size: Option, +} + +impl NestedDictIter +where + I: Pages, + K: DictionaryKey, +{ + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + ) -> Self { + Self { + iter, + init, + data_type, + values: None, + remaining: num_rows, + items: VecDeque::new(), + chunk_size, + } + } +} + +impl Iterator for NestedDictIter +where + I: Pages, + K: DictionaryKey, +{ + type Item = Result<(NestedState, DictionaryArray)>; + + fn next(&mut self) -> Option { + let maybe_state = nested_next_dict( + &mut self.iter, + &mut self.items, + &mut self.remaining, + &self.init, + &mut self.values, + self.data_type.clone(), + self.chunk_size, + |dict| read_dict(self.data_type.clone(), dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/mod.rs new file mode 100644 index 000000000000..c48bfe276bcc --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/mod.rs @@ -0,0 +1,8 @@ +mod basic; +mod dictionary; +mod nested; +mod utils; + +pub use basic::Iter; +pub use dictionary::{DictIter, NestedDictIter}; +pub use nested::NestedIter; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/nested.rs new file mode 100644 index 000000000000..f2b65380baad --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/nested.rs @@ -0,0 +1,189 @@ +use std::collections::VecDeque; + +use parquet2::encoding::Encoding; +use parquet2::page::{DataPage, DictPage}; +use parquet2::schema::Repetition; + +use super::super::utils::{not_implemented, MaybeNext, PageState}; +use super::utils::FixedSizeBinary; +use crate::array::FixedSizeBinaryArray; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::io::parquet::read::deserialize::fixed_size_binary::basic::{ + finish, Dict, Optional, OptionalDictionary, Required, RequiredDictionary, +}; +use crate::io::parquet::read::deserialize::nested_utils::{next, 
NestedDecoder}; +use crate::io::parquet::read::deserialize::utils::Pushable; +use crate::io::parquet::read::{InitNested, NestedState, Pages}; + +#[derive(Debug)] +enum State<'a> { + Optional(Optional<'a>), + Required(Required<'a>), + RequiredDictionary(RequiredDictionary<'a>), + OptionalDictionary(OptionalDictionary<'a>), +} + +impl<'a> PageState<'a> for State<'a> { + fn len(&self) -> usize { + match self { + State::Optional(state) => state.validity.len(), + State::Required(state) => state.len(), + State::RequiredDictionary(state) => state.len(), + State::OptionalDictionary(state) => state.validity.len(), + } + } +} + +#[derive(Debug, Default)] +struct BinaryDecoder { + size: usize, +} + +impl<'a> NestedDecoder<'a> for BinaryDecoder { + type State = State<'a>; + type Dictionary = Dict; + type DecodedState = (FixedSizeBinary, MutableBitmap); + + fn build_state( + &self, + page: &'a DataPage, + dict: Option<&'a Self::Dictionary>, + ) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::Plain, _, true, false) => { + Ok(State::Optional(Optional::try_new(page, self.size)?)) + }, + (Encoding::Plain, _, false, false) => { + Ok(State::Required(Required::new(page, self.size))) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, false) => { + RequiredDictionary::try_new(page, dict).map(State::RequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + OptionalDictionary::try_new(page, dict).map(State::OptionalDictionary) + }, + _ => Err(not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + FixedSizeBinary::with_capacity(capacity, self.size), + MutableBitmap::with_capacity(capacity), + ) + } + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()> { + let (values, validity) = decoded; + match state { + State::Optional(page) => { + let value = page.values.by_ref().next().unwrap_or_default(); + values.push(value); + validity.push(true); + }, + State::Required(page) => { + let value = page.values.by_ref().next().unwrap_or_default(); + values.push(value); + }, + State::RequiredDictionary(page) => { + let item = page + .values + .by_ref() + .next() + .map(|index| { + let index = index.unwrap() as usize; + &page.dict[index * self.size..(index + 1) * self.size] + }) + .unwrap_or_default(); + values.push(item); + }, + State::OptionalDictionary(page) => { + let item = page + .values + .by_ref() + .next() + .map(|index| { + let index = index.unwrap() as usize; + &page.dict[index * self.size..(index + 1) * self.size] + }) + .unwrap_or_default(); + values.push(item); + validity.push(true); + }, + } + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let (values, validity) = decoded; + values.push_null(); + validity.push(false); + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dictionary { + page.buffer.clone() + } +} + +pub struct NestedIter { + iter: I, + data_type: DataType, + size: usize, + init: Vec, + items: VecDeque<(NestedState, (FixedSizeBinary, MutableBitmap))>, + dict: Option, + chunk_size: Option, + remaining: usize, +} + +impl NestedIter { + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + ) -> Self { + let size = FixedSizeBinaryArray::get_size(&data_type); + 
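+        // the byte width is taken from the `FixedSizeBinary` data type itself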
Self { + iter, + data_type, + size, + init, + items: VecDeque::new(), + dict: None, + chunk_size, + remaining: num_rows, + } + } +} + +impl Iterator for NestedIter { + type Item = Result<(NestedState, FixedSizeBinaryArray)>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + &self.init, + self.chunk_size, + &BinaryDecoder { size: self.size }, + ); + match maybe_state { + MaybeNext::Some(Ok((nested, decoded))) => { + Some(Ok((nested, finish(&self.data_type, decoded.0, decoded.1)))) + }, + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/utils.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/utils.rs new file mode 100644 index 000000000000..f718ce1bdc2b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/fixed_size_binary/utils.rs @@ -0,0 +1,58 @@ +use super::super::utils::Pushable; + +/// A [`Pushable`] for fixed sized binary data +#[derive(Debug)] +pub struct FixedSizeBinary { + pub values: Vec, + pub size: usize, +} + +impl FixedSizeBinary { + #[inline] + pub fn with_capacity(capacity: usize, size: usize) -> Self { + Self { + values: Vec::with_capacity(capacity * size), + size, + } + } + + #[inline] + pub fn push(&mut self, value: &[u8]) { + debug_assert_eq!(value.len(), self.size); + self.values.extend(value); + } + + #[inline] + pub fn extend_constant(&mut self, additional: usize) { + self.values + .resize(self.values.len() + additional * self.size, 0); + } +} + +impl<'a> Pushable<&'a [u8]> for FixedSizeBinary { + #[inline] + fn reserve(&mut self, additional: usize) { + self.values.reserve(additional * self.size); + } + #[inline] + fn push(&mut self, value: &[u8]) { + debug_assert_eq!(value.len(), self.size); + self.push(value); + } + + #[inline] + fn push_null(&mut self) { + self.values.extend(std::iter::repeat(0).take(self.size)) + } + + #[inline] + fn extend_constant(&mut self, additional: usize, value: &[u8]) { + assert_eq!(value.len(), 0); + self.extend_constant(additional) + } + + #[inline] + fn len(&self) -> usize { + self.values.len() / self.size + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/mod.rs new file mode 100644 index 000000000000..098430b3d154 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/mod.rs @@ -0,0 +1,212 @@ +//! APIs to read from Parquet format. +mod binary; +mod boolean; +mod dictionary; +mod fixed_size_binary; +mod nested; +mod nested_utils; +mod null; +mod primitive; +mod simple; +mod struct_; +mod utils; + +use parquet2::read::get_page_iterator as _get_page_iterator; +use parquet2::schema::types::PrimitiveType; +use simple::page_iter_to_arrays; + +pub use self::nested_utils::{init_nested, InitNested, NestedArrayIter, NestedState}; +pub use self::struct_::StructIterator; +use super::*; +use crate::array::{Array, DictionaryKey, FixedSizeListArray, ListArray, MapArray}; +use crate::datatypes::{DataType, Field, IntervalUnit}; +use crate::error::Result; +use crate::offset::Offsets; + +/// Creates a new iterator of compressed pages. 
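+/// This is a thin wrapper around parquet2's page iterator that forwards the
+/// optional `pages_filter` and the reusable page `buffer`.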
+pub fn get_page_iterator( + column_metadata: &ColumnChunkMetaData, + reader: R, + pages_filter: Option, + buffer: Vec, + max_header_size: usize, +) -> Result> { + Ok(_get_page_iterator( + column_metadata, + reader, + pages_filter, + buffer, + max_header_size, + )?) +} + +/// Creates a new [`ListArray`] or [`FixedSizeListArray`]. +pub fn create_list( + data_type: DataType, + nested: &mut NestedState, + values: Box, +) -> Box { + let (mut offsets, validity) = nested.nested.pop().unwrap().inner(); + match data_type.to_logical_type() { + DataType::List(_) => { + offsets.push(values.len() as i64); + + let offsets = offsets.iter().map(|x| *x as i32).collect::>(); + + let offsets: Offsets = offsets + .try_into() + .expect("i64 offsets do not fit in i32 offsets"); + + Box::new(ListArray::::new( + data_type, + offsets.into(), + values, + validity.and_then(|x| x.into()), + )) + }, + DataType::LargeList(_) => { + offsets.push(values.len() as i64); + + Box::new(ListArray::::new( + data_type, + offsets.try_into().expect("List too large"), + values, + validity.and_then(|x| x.into()), + )) + }, + DataType::FixedSizeList(_, _) => Box::new(FixedSizeListArray::new( + data_type, + values, + validity.and_then(|x| x.into()), + )), + _ => unreachable!(), + } +} + +/// Creates a new [`MapArray`]. +pub fn create_map( + data_type: DataType, + nested: &mut NestedState, + values: Box, +) -> Box { + let (mut offsets, validity) = nested.nested.pop().unwrap().inner(); + match data_type.to_logical_type() { + DataType::Map(_, _) => { + offsets.push(values.len() as i64); + let offsets = offsets.iter().map(|x| *x as i32).collect::>(); + + let offsets: Offsets = offsets + .try_into() + .expect("i64 offsets do not fit in i32 offsets"); + + Box::new(MapArray::new( + data_type, + offsets.into(), + values, + validity.and_then(|x| x.into()), + )) + }, + _ => unreachable!(), + } +} + +fn is_primitive(data_type: &DataType) -> bool { + matches!( + data_type.to_physical_type(), + crate::datatypes::PhysicalType::Primitive(_) + | crate::datatypes::PhysicalType::Null + | crate::datatypes::PhysicalType::Boolean + | crate::datatypes::PhysicalType::Utf8 + | crate::datatypes::PhysicalType::LargeUtf8 + | crate::datatypes::PhysicalType::Binary + | crate::datatypes::PhysicalType::LargeBinary + | crate::datatypes::PhysicalType::FixedSizeBinary + | crate::datatypes::PhysicalType::Dictionary(_) + ) +} + +fn columns_to_iter_recursive<'a, I: 'a>( + mut columns: Vec, + mut types: Vec<&PrimitiveType>, + field: Field, + init: Vec, + num_rows: usize, + chunk_size: Option, +) -> Result> +where + I: Pages, +{ + if init.is_empty() && is_primitive(&field.data_type) { + return Ok(Box::new( + page_iter_to_arrays( + columns.pop().unwrap(), + types.pop().unwrap(), + field.data_type, + chunk_size, + num_rows, + )? + .map(|x| Ok((NestedState::new(vec![]), x?))), + )); + } + + nested::columns_to_iter_recursive(columns, types, field, init, num_rows, chunk_size) +} + +/// Returns the number of (parquet) columns that a [`DataType`] contains. 
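+/// Nested types recurse into their inner field: lists and maps count the columns
+/// of their child, while structs sum the counts of all their fields.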
+pub fn n_columns(data_type: &DataType) -> usize { + use crate::datatypes::PhysicalType::*; + match data_type.to_physical_type() { + Null | Boolean | Primitive(_) | Binary | FixedSizeBinary | LargeBinary | Utf8 + | Dictionary(_) | LargeUtf8 => 1, + List | FixedSizeList | LargeList => { + let a = data_type.to_logical_type(); + if let DataType::List(inner) = a { + n_columns(&inner.data_type) + } else if let DataType::LargeList(inner) = a { + n_columns(&inner.data_type) + } else if let DataType::FixedSizeList(inner, _) = a { + n_columns(&inner.data_type) + } else { + unreachable!() + } + }, + Map => { + let a = data_type.to_logical_type(); + if let DataType::Map(inner, _) = a { + n_columns(&inner.data_type) + } else { + unreachable!() + } + }, + Struct => { + if let DataType::Struct(fields) = data_type.to_logical_type() { + fields.iter().map(|inner| n_columns(&inner.data_type)).sum() + } else { + unreachable!() + } + }, + _ => todo!(), + } +} + +/// An iterator adapter that maps multiple iterators of [`Pages`] into an iterator of [`Array`]s. +/// +/// For a non-nested datatypes such as [`DataType::Int32`], this function requires a single element in `columns` and `types`. +/// For nested types, `columns` must be composed by all parquet columns with associated types `types`. +/// +/// The arrays are guaranteed to be at most of size `chunk_size` and data type `field.data_type`. +pub fn column_iter_to_arrays<'a, I: 'a>( + columns: Vec, + types: Vec<&PrimitiveType>, + field: Field, + chunk_size: Option, + num_rows: usize, +) -> Result> +where + I: Pages, +{ + Ok(Box::new( + columns_to_iter_recursive(columns, types, field, vec![], num_rows, chunk_size)? + .map(|x| x.map(|x| x.1)), + )) +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/nested.rs new file mode 100644 index 000000000000..14f75fa8d672 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/nested.rs @@ -0,0 +1,590 @@ +use ethnum::I256; +use parquet2::schema::types::PrimitiveType; + +use super::nested_utils::{InitNested, NestedArrayIter}; +use super::*; +use crate::array::PrimitiveArray; +use crate::datatypes::{DataType, Field}; +use crate::error::{Error, Result}; + +/// Converts an iterator of arrays to a trait object returning trait objects +#[inline] +fn remove_nested<'a, I>(iter: I) -> NestedArrayIter<'a> +where + I: Iterator)>> + Send + Sync + 'a, +{ + Box::new(iter.map(|x| { + x.map(|(mut nested, array)| { + let _ = nested.nested.pop().unwrap(); // the primitive + (nested, array) + }) + })) +} + +/// Converts an iterator of arrays to a trait object returning trait objects +#[inline] +fn primitive<'a, A, I>(iter: I) -> NestedArrayIter<'a> +where + A: Array, + I: Iterator> + Send + Sync + 'a, +{ + Box::new(iter.map(|x| { + x.map(|(mut nested, array)| { + let _ = nested.nested.pop().unwrap(); // the primitive + (nested, Box::new(array) as _) + }) + })) +} + +pub fn columns_to_iter_recursive<'a, I: 'a>( + mut columns: Vec, + mut types: Vec<&PrimitiveType>, + field: Field, + mut init: Vec, + num_rows: usize, + chunk_size: Option, +) -> Result> +where + I: Pages, +{ + use crate::datatypes::PhysicalType::*; + use crate::datatypes::PrimitiveType::*; + + Ok(match field.data_type().to_physical_type() { + Null => { + // physical type is i32 + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(null::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + )) + }, + Boolean 
=> { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(boolean::NestedIter::new( + columns.pop().unwrap(), + init, + num_rows, + chunk_size, + )) + }, + Primitive(Int8) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x as i8, + )) + }, + Primitive(Int16) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x as i16, + )) + }, + Primitive(Int32) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x, + )) + }, + Primitive(Int64) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i64| x, + )) + }, + Primitive(UInt8) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x as u8, + )) + }, + Primitive(UInt16) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x as u16, + )) + }, + Primitive(UInt32) => { + init.push(InitNested::Primitive(field.is_nullable)); + let type_ = types.pop().unwrap(); + match type_.physical_type { + PhysicalType::Int32 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i32| x as u32, + )), + // some implementations of parquet write arrow's u32 into i64. 
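+                    // in that case the stored i64 values are narrowed back to u32 on read.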
+ PhysicalType::Int64 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i64| x as u32, + )), + other => { + return Err(Error::nyi(format!( + "Deserializing UInt32 from {other:?}'s parquet" + ))) + }, + } + }, + Primitive(UInt64) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: i64| x as u64, + )) + }, + Primitive(Float32) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: f32| x, + )) + }, + Primitive(Float64) => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + |x: f64| x, + )) + }, + Binary | Utf8 => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + remove_nested(binary::NestedIter::::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + )) + }, + LargeBinary | LargeUtf8 => { + init.push(InitNested::Primitive(field.is_nullable)); + types.pop(); + remove_nested(binary::NestedIter::::new( + columns.pop().unwrap(), + init, + field.data_type().clone(), + num_rows, + chunk_size, + )) + }, + _ => match field.data_type().to_logical_type() { + DataType::Dictionary(key_type, _, _) => { + init.push(InitNested::Primitive(field.is_nullable)); + let type_ = types.pop().unwrap(); + let iter = columns.pop().unwrap(); + let data_type = field.data_type().clone(); + match_integer_type!(key_type, |$K| { + dict_read::<$K, _>(iter, init, type_, data_type, num_rows, chunk_size) + })? + }, + DataType::List(inner) + | DataType::LargeList(inner) + | DataType::FixedSizeList(inner, _) => { + init.push(InitNested::List(field.is_nullable)); + let iter = columns_to_iter_recursive( + columns, + types, + inner.as_ref().clone(), + init, + num_rows, + chunk_size, + )?; + let iter = iter.map(move |x| { + let (mut nested, array) = x?; + let array = create_list(field.data_type().clone(), &mut nested, array); + Ok((nested, array)) + }); + Box::new(iter) as _ + }, + DataType::Decimal(_, _) => { + init.push(InitNested::Primitive(field.is_nullable)); + let type_ = types.pop().unwrap(); + match type_.physical_type { + PhysicalType::Int32 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type.clone(), + num_rows, + chunk_size, + |x: i32| x as i128, + )), + PhysicalType::Int64 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type.clone(), + num_rows, + chunk_size, + |x: i64| x as i128, + )), + PhysicalType::FixedLenByteArray(n) if n > 16 => { + return Err(Error::InvalidArgumentError(format!( + "Can't decode Decimal128 type from `FixedLenByteArray` of len {n}" + ))) + }, + PhysicalType::FixedLenByteArray(n) => { + let iter = fixed_size_binary::NestedIter::new( + columns.pop().unwrap(), + init, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + // Convert the fixed length byte array to Decimal. 
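+                        // each n-byte big-endian value is sign-extended into an i128.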
+ let iter = iter.map(move |x| { + let (mut nested, array) = x?; + let values = array + .values() + .chunks_exact(n) + .map(|value: &[u8]| super::super::convert_i128(value, n)) + .collect::>(); + let validity = array.validity().cloned(); + + let array: Box = Box::new(PrimitiveArray::::try_new( + field.data_type.clone(), + values.into(), + validity, + )?); + + let _ = nested.nested.pop().unwrap(); // the primitive + + Ok((nested, array)) + }); + Box::new(iter) + }, + _ => { + return Err(Error::nyi(format!( + "Deserializing type for Decimal {:?} from parquet", + type_.physical_type + ))) + }, + } + }, + DataType::Decimal256(_, _) => { + init.push(InitNested::Primitive(field.is_nullable)); + let type_ = types.pop().unwrap(); + match type_.physical_type { + PhysicalType::Int32 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type.clone(), + num_rows, + chunk_size, + |x: i32| i256(I256::new(x as i128)), + )), + PhysicalType::Int64 => primitive(primitive::NestedIter::new( + columns.pop().unwrap(), + init, + field.data_type.clone(), + num_rows, + chunk_size, + |x: i64| i256(I256::new(x as i128)), + )), + PhysicalType::FixedLenByteArray(n) if n <= 16 => { + let iter = fixed_size_binary::NestedIter::new( + columns.pop().unwrap(), + init, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + // Convert the fixed length byte array to Decimal. + let iter = iter.map(move |x| { + let (mut nested, array) = x?; + let values = array + .values() + .chunks_exact(n) + .map(|value| i256(I256::new(super::super::convert_i128(value, n)))) + .collect::>(); + let validity = array.validity().cloned(); + + let array: Box = Box::new(PrimitiveArray::::try_new( + field.data_type.clone(), + values.into(), + validity, + )?); + + let _ = nested.nested.pop().unwrap(); // the primitive + + Ok((nested, array)) + }); + Box::new(iter) as _ + }, + + PhysicalType::FixedLenByteArray(n) if n <= 32 => { + let iter = fixed_size_binary::NestedIter::new( + columns.pop().unwrap(), + init, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + // Convert the fixed length byte array to Decimal. 
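+                        // this branch (17..=32 bytes) converts the bytes directly to i256.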
+ let iter = iter.map(move |x| { + let (mut nested, array) = x?; + let values = array + .values() + .chunks_exact(n) + .map(super::super::convert_i256) + .collect::>(); + let validity = array.validity().cloned(); + + let array: Box = Box::new(PrimitiveArray::::try_new( + field.data_type.clone(), + values.into(), + validity, + )?); + + let _ = nested.nested.pop().unwrap(); // the primitive + + Ok((nested, array)) + }); + Box::new(iter) as _ + }, + PhysicalType::FixedLenByteArray(n) => { + return Err(Error::InvalidArgumentError(format!( + "Can't decode Decimal256 type from from `FixedLenByteArray` of len {n}" + ))) + }, + _ => { + return Err(Error::nyi(format!( + "Deserializing type for Decimal {:?} from parquet", + type_.physical_type + ))) + }, + } + }, + DataType::Struct(fields) => { + let columns = fields + .iter() + .rev() + .map(|f| { + let mut init = init.clone(); + init.push(InitNested::Struct(field.is_nullable)); + let n = n_columns(&f.data_type); + let columns = columns.drain(columns.len() - n..).collect(); + let types = types.drain(types.len() - n..).collect(); + columns_to_iter_recursive( + columns, + types, + f.clone(), + init, + num_rows, + chunk_size, + ) + }) + .collect::>>()?; + let columns = columns.into_iter().rev().collect(); + Box::new(struct_::StructIterator::new(columns, fields.clone())) + }, + DataType::Map(inner, _) => { + init.push(InitNested::List(field.is_nullable)); + let iter = columns_to_iter_recursive( + columns, + types, + inner.as_ref().clone(), + init, + num_rows, + chunk_size, + )?; + let iter = iter.map(move |x| { + let (mut nested, array) = x?; + let array = create_map(field.data_type().clone(), &mut nested, array); + Ok((nested, array)) + }); + Box::new(iter) as _ + }, + other => { + return Err(Error::nyi(format!( + "Deserializing type {other:?} from parquet" + ))) + }, + }, + }) +} + +fn dict_read<'a, K: DictionaryKey, I: 'a + Pages>( + iter: I, + init: Vec, + _type_: &PrimitiveType, + data_type: DataType, + num_rows: usize, + chunk_size: Option, +) -> Result> { + use DataType::*; + let values_data_type = if let Dictionary(_, v, _) = &data_type { + v.as_ref() + } else { + panic!() + }; + + Ok(match values_data_type.to_logical_type() { + UInt8 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x as u8, + )), + UInt16 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x as u16, + )), + UInt32 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x as u32, + )), + Int8 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x as i8, + )), + Int16 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x as i16, + )), + Int32 | Date32 | Time32(_) | Interval(IntervalUnit::YearMonth) => { + primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i32| x, + )) + }, + Int64 | Date64 | Time64(_) | Duration(_) => { + primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: i64| x as i32, + )) + }, + Float32 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: f32| x, + )), + Float64 => primitive(primitive::NestedDictIter::::new( + iter, + init, + data_type, + num_rows, + chunk_size, + |x: f64| x, + )), + Utf8 | Binary => 
primitive(binary::NestedDictIter::::new( + iter, init, data_type, num_rows, chunk_size, + )), + LargeUtf8 | LargeBinary => primitive(binary::NestedDictIter::::new( + iter, init, data_type, num_rows, chunk_size, + )), + FixedSizeBinary(_) => primitive(fixed_size_binary::NestedDictIter::::new( + iter, init, data_type, num_rows, chunk_size, + )), + /* + + Timestamp(time_unit, _) => { + let time_unit = *time_unit; + return timestamp_dict::( + iter, + physical_type, + logical_type, + data_type, + chunk_size, + time_unit, + ); + } + */ + other => { + return Err(Error::nyi(format!( + "Reading nested dictionaries of type {other:?}" + ))) + }, + }) +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/nested_utils.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/nested_utils.rs new file mode 100644 index 000000000000..fc68080e0799 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/nested_utils.rs @@ -0,0 +1,556 @@ +use std::collections::VecDeque; + +use parquet2::encoding::hybrid_rle::HybridRleDecoder; +use parquet2::page::{split_buffer, DataPage, DictPage, Page}; +use parquet2::read::levels::get_bit_width; + +use super::super::Pages; +pub use super::utils::Zip; +use super::utils::{DecodedState, MaybeNext, PageState}; +use crate::array::Array; +use crate::bitmap::MutableBitmap; +use crate::error::Result; + +/// trait describing deserialized repetition and definition levels +pub trait Nested: std::fmt::Debug + Send + Sync { + fn inner(&mut self) -> (Vec, Option); + + fn push(&mut self, length: i64, is_valid: bool); + + fn is_nullable(&self) -> bool; + + fn is_repeated(&self) -> bool { + false + } + + // Whether the Arrow container requires all items to be filled. + fn is_required(&self) -> bool; + + /// number of rows + fn len(&self) -> usize; + + /// number of values associated to the primitive type this nested tracks + fn num_values(&self) -> usize; +} + +#[derive(Debug, Default)] +pub struct NestedPrimitive { + is_nullable: bool, + length: usize, +} + +impl NestedPrimitive { + pub fn new(is_nullable: bool) -> Self { + Self { + is_nullable, + length: 0, + } + } +} + +impl Nested for NestedPrimitive { + fn inner(&mut self) -> (Vec, Option) { + (Default::default(), Default::default()) + } + + fn is_nullable(&self) -> bool { + self.is_nullable + } + + fn is_required(&self) -> bool { + false + } + + fn push(&mut self, _value: i64, _is_valid: bool) { + self.length += 1 + } + + fn len(&self) -> usize { + self.length + } + + fn num_values(&self) -> usize { + self.length + } +} + +#[derive(Debug, Default)] +pub struct NestedOptional { + pub validity: MutableBitmap, + pub offsets: Vec, +} + +impl Nested for NestedOptional { + fn inner(&mut self) -> (Vec, Option) { + let offsets = std::mem::take(&mut self.offsets); + let validity = std::mem::take(&mut self.validity); + (offsets, Some(validity)) + } + + fn is_nullable(&self) -> bool { + true + } + + fn is_repeated(&self) -> bool { + true + } + + fn is_required(&self) -> bool { + // it may be for FixedSizeList + false + } + + fn push(&mut self, value: i64, is_valid: bool) { + self.offsets.push(value); + self.validity.push(is_valid); + } + + fn len(&self) -> usize { + self.offsets.len() + } + + fn num_values(&self) -> usize { + self.offsets.last().copied().unwrap_or(0) as usize + } +} + +impl NestedOptional { + pub fn with_capacity(capacity: usize) -> Self { + let offsets = Vec::::with_capacity(capacity + 1); + let validity = MutableBitmap::with_capacity(capacity); + Self { validity, offsets } + } +} + +#[derive(Debug, 
Default)] +pub struct NestedValid { + pub offsets: Vec, +} + +impl Nested for NestedValid { + fn inner(&mut self) -> (Vec, Option) { + let offsets = std::mem::take(&mut self.offsets); + (offsets, None) + } + + fn is_nullable(&self) -> bool { + false + } + + fn is_repeated(&self) -> bool { + true + } + + fn is_required(&self) -> bool { + // it may be for FixedSizeList + false + } + + fn push(&mut self, value: i64, _is_valid: bool) { + self.offsets.push(value); + } + + fn len(&self) -> usize { + self.offsets.len() + } + + fn num_values(&self) -> usize { + self.offsets.last().copied().unwrap_or(0) as usize + } +} + +impl NestedValid { + pub fn with_capacity(capacity: usize) -> Self { + let offsets = Vec::::with_capacity(capacity + 1); + Self { offsets } + } +} + +#[derive(Debug, Default)] +pub struct NestedStructValid { + length: usize, +} + +impl NestedStructValid { + pub fn new() -> Self { + Self { length: 0 } + } +} + +impl Nested for NestedStructValid { + fn inner(&mut self) -> (Vec, Option) { + (Default::default(), None) + } + + fn is_nullable(&self) -> bool { + false + } + + fn is_required(&self) -> bool { + true + } + + fn push(&mut self, _value: i64, _is_valid: bool) { + self.length += 1; + } + + fn len(&self) -> usize { + self.length + } + + fn num_values(&self) -> usize { + self.length + } +} + +#[derive(Debug, Default)] +pub struct NestedStruct { + validity: MutableBitmap, +} + +impl NestedStruct { + pub fn with_capacity(capacity: usize) -> Self { + Self { + validity: MutableBitmap::with_capacity(capacity), + } + } +} + +impl Nested for NestedStruct { + fn inner(&mut self) -> (Vec, Option) { + (Default::default(), Some(std::mem::take(&mut self.validity))) + } + + fn is_nullable(&self) -> bool { + true + } + + fn is_required(&self) -> bool { + true + } + + fn push(&mut self, _value: i64, is_valid: bool) { + self.validity.push(is_valid) + } + + fn len(&self) -> usize { + self.validity.len() + } + + fn num_values(&self) -> usize { + self.validity.len() + } +} + +/// A decoder that knows how to map `State` -> Array +pub(super) trait NestedDecoder<'a> { + type State: PageState<'a>; + type Dictionary; + type DecodedState: DecodedState; + + fn build_state( + &self, + page: &'a DataPage, + dict: Option<&'a Self::Dictionary>, + ) -> Result; + + /// Initializes a new state + fn with_capacity(&self, capacity: usize) -> Self::DecodedState; + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()>; + fn push_null(&self, decoded: &mut Self::DecodedState); + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dictionary; +} + +/// The initial info of nested data types. +#[derive(Debug, Clone, Copy, PartialEq, Eq)] +pub enum InitNested { + /// Primitive data types + Primitive(bool), + /// List data types + List(bool), + /// Struct data types + Struct(bool), +} + +/// Initialize [`NestedState`] from `&[InitNested]`. 
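+/// Each [`InitNested`] level is mapped to its runtime container: primitives to
+/// [`NestedPrimitive`], lists to [`NestedOptional`] or [`NestedValid`], and structs
+/// to [`NestedStruct`] or [`NestedStructValid`], depending on nullability.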
+pub fn init_nested(init: &[InitNested], capacity: usize) -> NestedState { + let container = init + .iter() + .map(|init| match init { + InitNested::Primitive(is_nullable) => { + Box::new(NestedPrimitive::new(*is_nullable)) as Box + }, + InitNested::List(is_nullable) => { + if *is_nullable { + Box::new(NestedOptional::with_capacity(capacity)) as Box + } else { + Box::new(NestedValid::with_capacity(capacity)) as Box + } + }, + InitNested::Struct(is_nullable) => { + if *is_nullable { + Box::new(NestedStruct::with_capacity(capacity)) as Box + } else { + Box::new(NestedStructValid::new()) as Box + } + }, + }) + .collect(); + NestedState::new(container) +} + +pub struct NestedPage<'a> { + iter: std::iter::Peekable, HybridRleDecoder<'a>>>, +} + +impl<'a> NestedPage<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (rep_levels, def_levels, _) = split_buffer(page)?; + + let max_rep_level = page.descriptor.max_rep_level; + let max_def_level = page.descriptor.max_def_level; + + let reps = + HybridRleDecoder::try_new(rep_levels, get_bit_width(max_rep_level), page.num_values())?; + let defs = + HybridRleDecoder::try_new(def_levels, get_bit_width(max_def_level), page.num_values())?; + + let iter = reps.zip(defs).peekable(); + + Ok(Self { iter }) + } + + // number of values (!= number of rows) + pub fn len(&self) -> usize { + self.iter.size_hint().0 + } +} + +/// The state of nested data types. +#[derive(Debug)] +pub struct NestedState { + /// The nesteds composing `NestedState`. + pub nested: Vec>, +} + +impl NestedState { + /// Creates a new [`NestedState`]. + pub fn new(nested: Vec>) -> Self { + Self { nested } + } + + /// The number of rows in this state + pub fn len(&self) -> usize { + // outermost is the number of rows + self.nested[0].len() + } +} + +/// Extends `items` by consuming `page`, first trying to complete the last `item` +/// and extending it if more are needed +pub(super) fn extend<'a, D: NestedDecoder<'a>>( + page: &'a DataPage, + init: &[InitNested], + items: &mut VecDeque<(NestedState, D::DecodedState)>, + dict: Option<&'a D::Dictionary>, + remaining: &mut usize, + decoder: &D, + chunk_size: Option, +) -> Result<()> { + let mut values_page = decoder.build_state(page, dict)?; + let mut page = NestedPage::try_new(page)?; + + let capacity = chunk_size.unwrap_or(0); + // chunk_size = None, remaining = 44 => chunk_size = 44 + let chunk_size = chunk_size.unwrap_or(usize::MAX); + + let (mut nested, mut decoded) = if let Some((nested, decoded)) = items.pop_back() { + (nested, decoded) + } else { + // there is no state => initialize it + (init_nested(init, capacity), decoder.with_capacity(0)) + }; + let existing = nested.len(); + + let additional = (chunk_size - existing).min(*remaining); + + // extend the current state + extend_offsets2( + &mut page, + &mut values_page, + &mut nested.nested, + &mut decoded, + decoder, + additional, + )?; + *remaining -= nested.len() - existing; + items.push_back((nested, decoded)); + + while page.len() > 0 && *remaining > 0 { + let additional = chunk_size.min(*remaining); + + let mut nested = init_nested(init, additional); + let mut decoded = decoder.with_capacity(0); + extend_offsets2( + &mut page, + &mut values_page, + &mut nested.nested, + &mut decoded, + decoder, + additional, + )?; + *remaining -= nested.len(); + items.push_back((nested, decoded)); + } + Ok(()) +} + +fn extend_offsets2<'a, D: NestedDecoder<'a>>( + page: &mut NestedPage<'a>, + values_state: &mut D::State, + nested: &mut [Box], + decoded: &mut D::DecodedState, + decoder: &D, + 
additional: usize, +) -> Result<()> { + let max_depth = nested.len(); + + let mut cum_sum = vec![0u32; max_depth + 1]; + for (i, nest) in nested.iter().enumerate() { + let delta = nest.is_nullable() as u32 + nest.is_repeated() as u32; + cum_sum[i + 1] = cum_sum[i] + delta; + } + + let mut cum_rep = vec![0u32; max_depth + 1]; + for (i, nest) in nested.iter().enumerate() { + let delta = nest.is_repeated() as u32; + cum_rep[i + 1] = cum_rep[i] + delta; + } + + let mut rows = 0; + while let Some((rep, def)) = page.iter.next() { + let rep = rep?; + let def = def?; + if rep == 0 { + rows += 1; + } + + let mut is_required = false; + for depth in 0..max_depth { + let right_level = rep <= cum_rep[depth] && def >= cum_sum[depth]; + if is_required || right_level { + let length = nested + .get(depth + 1) + .map(|x| x.len() as i64) + // the last depth is the leaf, which is always increased by 1 + .unwrap_or(1); + + let nest = &mut nested[depth]; + + let is_valid = nest.is_nullable() && def > cum_sum[depth]; + nest.push(length, is_valid); + is_required = nest.is_required() && !is_valid; + + if depth == max_depth - 1 { + // the leaf / primitive + let is_valid = (def != cum_sum[depth]) || !nest.is_nullable(); + if right_level && is_valid { + decoder.push_valid(values_state, decoded)?; + } else { + decoder.push_null(decoded); + } + } + } + } + + let next_rep = *page + .iter + .peek() + .map(|x| x.0.as_ref()) + .transpose() + .unwrap() // todo: fix this + .unwrap_or(&0); + + if next_rep == 0 && rows == additional { + break; + } + } + Ok(()) +} + +#[inline] +pub(super) fn next<'a, I, D>( + iter: &'a mut I, + items: &mut VecDeque<(NestedState, D::DecodedState)>, + dict: &'a mut Option, + remaining: &mut usize, + init: &[InitNested], + chunk_size: Option, + decoder: &D, +) -> MaybeNext> +where + I: Pages, + D: NestedDecoder<'a>, +{ + // front[a1, a2, a3, ...]back + if items.len() > 1 { + return MaybeNext::Some(Ok(items.pop_front().unwrap())); + } + if (items.len() == 1) && items.front().unwrap().0.len() == chunk_size.unwrap_or(usize::MAX) { + return MaybeNext::Some(Ok(items.pop_front().unwrap())); + } + if *remaining == 0 { + return match items.pop_front() { + Some(decoded) => MaybeNext::Some(Ok(decoded)), + None => MaybeNext::None, + }; + } + match iter.next() { + Err(e) => MaybeNext::Some(Err(e.into())), + Ok(None) => { + if let Some(decoded) = items.pop_front() { + MaybeNext::Some(Ok(decoded)) + } else { + MaybeNext::None + } + }, + Ok(Some(page)) => { + let page = match page { + Page::Data(page) => page, + Page::Dict(dict_page) => { + *dict = Some(decoder.deserialize_dict(dict_page)); + return MaybeNext::More; + }, + }; + + // there is a new page => consume the page from the start + let error = extend( + page, + init, + items, + dict.as_ref(), + remaining, + decoder, + chunk_size, + ); + match error { + Ok(_) => {}, + Err(e) => return MaybeNext::Some(Err(e)), + }; + + if (items.len() == 1) + && items.front().unwrap().0.len() < chunk_size.unwrap_or(usize::MAX) + { + MaybeNext::More + } else { + MaybeNext::Some(Ok(items.pop_front().unwrap())) + } + }, + } +} + +/// Type def for a sharable, boxed dyn [`Iterator`] of NestedStates and arrays +pub type NestedArrayIter<'a> = + Box)>> + Send + Sync + 'a>; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/null/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/null/mod.rs new file mode 100644 index 000000000000..576db09d364b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/null/mod.rs @@ -0,0 +1,104 @@ +mod nested; + 
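// Illustrative sketch, not part of the original patch: the nested readers in this
// and the sibling modules are driven by `nested_utils::InitNested`, with one entry
// per nesting level of the Arrow type being deserialized. For a nullable
// `List<Int64>` whose items are required, the initialization would look roughly
// like this (the capacity of 1024 is an arbitrary example value):
//
//     use super::nested_utils::{init_nested, InitNested};
//
//     let init = vec![
//         InitNested::List(true),       // outer list level, nullable
//         InitNested::Primitive(false), // leaf values, required
//     ];
//     let state = init_nested(&init, 1024);
//     assert_eq!(state.nested.len(), 2); // one `Nested` tracker per level
//
// `extend_offsets2` in `nested_utils` then walks the (repetition, definition)
// level pairs of each data page and pushes lengths and validity into these trackers.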
+pub(super) use nested::NestedIter; +use parquet2::page::Page; + +use super::super::{ArrayIter, Pages}; +use crate::array::NullArray; +use crate::datatypes::DataType; + +/// Converts [`Pages`] to an [`ArrayIter`] +pub fn iter_to_arrays<'a, I>( + mut iter: I, + data_type: DataType, + chunk_size: Option, + num_rows: usize, +) -> ArrayIter<'a> +where + I: 'a + Pages, +{ + let mut len = 0usize; + + while let Ok(Some(page)) = iter.next() { + match page { + Page::Dict(_) => continue, + Page::Data(page) => { + let rows = page.num_values(); + len = (len + rows).min(num_rows); + if len == num_rows { + break; + } + }, + } + } + + if len == 0 { + return Box::new(std::iter::empty()); + } + + let chunk_size = chunk_size.unwrap_or(len); + + let complete_chunks = len / chunk_size; + + let remainder = len - (complete_chunks * chunk_size); + let i_data_type = data_type.clone(); + let complete = (0..complete_chunks) + .map(move |_| Ok(NullArray::new(i_data_type.clone(), chunk_size).boxed())); + if len % chunk_size == 0 { + Box::new(complete) + } else { + let array = NullArray::new(data_type, remainder); + Box::new(complete.chain(std::iter::once(Ok(array.boxed())))) + } +} + +#[cfg(test)] +mod tests { + use parquet2::encoding::Encoding; + use parquet2::error::Error as ParquetError; + use parquet2::metadata::Descriptor; + use parquet2::page::{DataPage, DataPageHeader, DataPageHeaderV1, Page}; + use parquet2::schema::types::{PhysicalType, PrimitiveType}; + + use super::iter_to_arrays; + use crate::array::NullArray; + use crate::datatypes::DataType; + use crate::error::Error; + + #[test] + fn limit() { + let new_page = |values: i32| { + Page::Data(DataPage::new( + DataPageHeader::V1(DataPageHeaderV1 { + num_values: values, + encoding: Encoding::Plain.into(), + definition_level_encoding: Encoding::Plain.into(), + repetition_level_encoding: Encoding::Plain.into(), + statistics: None, + }), + vec![], + Descriptor { + primitive_type: PrimitiveType::from_physical( + "a".to_string(), + PhysicalType::Int32, + ), + max_def_level: 0, + max_rep_level: 0, + }, + None, + )) + }; + + let p1 = new_page(100); + let p2 = new_page(100); + let pages = vec![Result::<_, ParquetError>::Ok(&p1), Ok(&p2)]; + let pages = fallible_streaming_iterator::convert(pages.into_iter()); + let arrays = iter_to_arrays(pages, DataType::Null, Some(10), 101); + + let arrays = arrays.collect::, Error>>().unwrap(); + let expected = std::iter::repeat(NullArray::new(DataType::Null, 10).boxed()) + .take(10) + .chain(std::iter::once(NullArray::new(DataType::Null, 1).boxed())); + assert_eq!(arrays, expected.collect::>()) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/null/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/null/nested.rs new file mode 100644 index 000000000000..9528720e73be --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/null/nested.rs @@ -0,0 +1,126 @@ +use std::collections::VecDeque; + +use parquet2::page::{DataPage, DictPage}; + +use super::super::nested_utils::*; +use super::super::{utils, Pages}; +use crate::array::NullArray; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::io::parquet::read::deserialize::utils::DecodedState; + +impl<'a> utils::PageState<'a> for usize { + fn len(&self) -> usize { + *self + } +} + +#[derive(Debug)] +struct NullDecoder {} + +impl DecodedState for usize { + fn len(&self) -> usize { + *self + } +} + +impl<'a> NestedDecoder<'a> for NullDecoder { + type State = usize; + type Dictionary = usize; + type DecodedState = usize; + + fn 
build_state( + &self, + _page: &'a DataPage, + dict: Option<&'a Self::Dictionary>, + ) -> Result { + if let Some(n) = dict { + return Ok(*n); + } + Ok(1) + } + + /// Initializes a new state + fn with_capacity(&self, _capacity: usize) -> Self::DecodedState { + 0 + } + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()> { + *decoded += *state; + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let length = decoded; + *length += 1; + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dictionary { + page.num_values + } +} + +/// An iterator adapter over [`Pages`] assumed to be encoded as null arrays +#[derive(Debug)] +pub struct NestedIter +where + I: Pages, +{ + iter: I, + init: Vec, + data_type: DataType, + items: VecDeque<(NestedState, usize)>, + remaining: usize, + chunk_size: Option, + decoder: NullDecoder, +} + +impl NestedIter +where + I: Pages, +{ + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + ) -> Self { + Self { + iter, + init, + data_type, + items: VecDeque::new(), + chunk_size, + remaining: num_rows, + decoder: NullDecoder {}, + } + } +} + +impl Iterator for NestedIter +where + I: Pages, +{ + type Item = Result<(NestedState, NullArray)>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut None, + &mut self.remaining, + &self.init, + self.chunk_size, + &self.decoder, + ); + match maybe_state { + utils::MaybeNext::Some(Ok((nested, state))) => { + Some(Ok((nested, NullArray::new(self.data_type.clone(), state)))) + }, + utils::MaybeNext::Some(Err(e)) => Some(Err(e)), + utils::MaybeNext::None => None, + utils::MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/basic.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/basic.rs new file mode 100644 index 000000000000..200c9a517dd0 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/basic.rs @@ -0,0 +1,370 @@ +use std::collections::VecDeque; + +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::{hybrid_rle, Encoding}; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; +use parquet2::types::{decode, NativeType as ParquetNativeType}; + +use super::super::utils::{get_selected_rows, FilteredOptionalPageValidity, OptionalPageValidity}; +use super::super::{utils, Pages}; +use crate::array::MutablePrimitiveArray; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::NativeType; + +#[derive(Debug)] +pub(super) struct FilteredRequiredValues<'a> { + values: SliceFilteredIter>, +} + +impl<'a> FilteredRequiredValues<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + assert_eq!(values.len() % std::mem::size_of::
<P>
(), 0); + + let values = values.chunks_exact(std::mem::size_of::
<P>
()); + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(Self { values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct Values<'a> { + pub values: std::slice::ChunksExact<'a, u8>, +} + +impl<'a> Values<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, _, values) = split_buffer(page)?; + assert_eq!(values.len() % std::mem::size_of::
<P>
(), 0); + Ok(Self { + values: values.chunks_exact(std::mem::size_of::
<P>
()), + }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +#[derive(Debug)] +pub(super) struct ValuesDictionary<'a, T> +where + T: NativeType, +{ + pub values: hybrid_rle::HybridRleDecoder<'a>, + pub dict: &'a Vec, +} + +impl<'a, T> ValuesDictionary<'a, T> +where + T: NativeType, +{ + pub fn try_new(page: &'a DataPage, dict: &'a Vec) -> Result { + let values = utils::dict_indices_decoder(page)?; + + Ok(Self { dict, values }) + } + + #[inline] + pub fn len(&self) -> usize { + self.values.size_hint().0 + } +} + +// The state of a `DataPage` of `Primitive` parquet primitive type +#[derive(Debug)] +pub(super) enum State<'a, T> +where + T: NativeType, +{ + Optional(OptionalPageValidity<'a>, Values<'a>), + Required(Values<'a>), + RequiredDictionary(ValuesDictionary<'a, T>), + OptionalDictionary(OptionalPageValidity<'a>, ValuesDictionary<'a, T>), + FilteredRequired(FilteredRequiredValues<'a>), + FilteredOptional(FilteredOptionalPageValidity<'a>, Values<'a>), +} + +impl<'a, T> utils::PageState<'a> for State<'a, T> +where + T: NativeType, +{ + fn len(&self) -> usize { + match self { + State::Optional(optional, _) => optional.len(), + State::Required(values) => values.len(), + State::RequiredDictionary(values) => values.len(), + State::OptionalDictionary(optional, _) => optional.len(), + State::FilteredRequired(values) => values.len(), + State::FilteredOptional(optional, _) => optional.len(), + } + } +} + +#[derive(Debug)] +pub(super) struct PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + phantom: std::marker::PhantomData, + phantom_p: std::marker::PhantomData
<P>
, + pub op: F, +} + +impl PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + #[inline] + pub(super) fn new(op: F) -> Self { + Self { + phantom: std::marker::PhantomData, + phantom_p: std::marker::PhantomData, + op, + } + } +} + +impl utils::DecodedState for (Vec, MutableBitmap) { + fn len(&self) -> usize { + self.0.len() + } +} + +impl<'a, T, P, F> utils::Decoder<'a> for PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type State = State<'a, T>; + type Dict = Vec; + type DecodedState = (Vec, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, dict: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, false) => { + ValuesDictionary::try_new(page, dict).map(State::RequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + Ok(State::OptionalDictionary( + OptionalPageValidity::try_new(page)?, + ValuesDictionary::try_new(page, dict)?, + )) + }, + (Encoding::Plain, _, true, false) => { + let validity = OptionalPageValidity::try_new(page)?; + let values = Values::try_new::
<P>
(page)?; + + Ok(State::Optional(validity, values)) + }, + (Encoding::Plain, _, false, false) => Ok(State::Required(Values::try_new::
<P>
(page)?)), + (Encoding::Plain, _, false, true) => { + FilteredRequiredValues::try_new::
<P>
(page).map(State::FilteredRequired) + }, + (Encoding::Plain, _, true, true) => Ok(State::FilteredOptional( + FilteredOptionalPageValidity::try_new(page)?, + Values::try_new::
<P>
(page)?, + )), + _ => Err(utils::not_implemented(page)), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Vec::::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + remaining: usize, + ) { + let (values, validity) = decoded; + match state { + State::Optional(page_validity, page_values) => utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values.values.by_ref().map(decode).map(self.op), + ), + State::Required(page) => { + values.extend( + page.values + .by_ref() + .map(decode) + .map(self.op) + .take(remaining), + ); + }, + State::OptionalDictionary(page_validity, page_values) => { + let op1 = |index: u32| page_values.dict[index as usize]; + utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + &mut page_values.values.by_ref().map(|x| x.unwrap()).map(op1), + ) + }, + State::RequiredDictionary(page) => { + let op1 = |index: u32| page.dict[index as usize]; + values.extend( + page.values + .by_ref() + .map(|x| x.unwrap()) + .map(op1) + .take(remaining), + ); + }, + State::FilteredRequired(page) => { + values.extend( + page.values + .by_ref() + .map(decode) + .map(self.op) + .take(remaining), + ); + }, + State::FilteredOptional(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values.values.by_ref().map(decode).map(self.op), + ); + }, + } + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dict { + deserialize_plain(&page.buffer, self.op) + } +} + +pub(super) fn finish( + data_type: &DataType, + values: Vec, + validity: MutableBitmap, +) -> MutablePrimitiveArray { + let validity = if validity.is_empty() { + None + } else { + Some(validity) + }; + MutablePrimitiveArray::try_new(data_type.clone(), values, validity).unwrap() +} + +/// An [`Iterator`] adapter over [`Pages`] assumed to be encoded as primitive arrays +#[derive(Debug)] +pub struct Iter +where + I: Pages, + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + iter: I, + data_type: DataType, + items: VecDeque<(Vec, MutableBitmap)>, + remaining: usize, + chunk_size: Option, + dict: Option>, + op: F, + phantom: std::marker::PhantomData
<P>
, +} + +impl Iter +where + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + pub fn new( + iter: I, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + op: F, + ) -> Self { + Self { + iter, + data_type, + items: VecDeque::new(), + dict: None, + remaining: num_rows, + chunk_size, + op, + phantom: Default::default(), + } + } +} + +impl Iterator for Iter +where + I: Pages, + T: NativeType, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = utils::next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + self.chunk_size, + &PrimitiveDecoder::new(self.op), + ); + match maybe_state { + utils::MaybeNext::Some(Ok((values, validity))) => { + Some(Ok(finish(&self.data_type, values, validity))) + }, + utils::MaybeNext::Some(Err(e)) => Some(Err(e)), + utils::MaybeNext::None => None, + utils::MaybeNext::More => self.next(), + } + } +} + +pub(super) fn deserialize_plain(values: &[u8], op: F) -> Vec +where + T: NativeType, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + values + .chunks_exact(std::mem::size_of::
<P>
()) + .map(decode) + .map(op) + .collect::>() +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/dictionary.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/dictionary.rs new file mode 100644 index 000000000000..35293d582d10 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/dictionary.rs @@ -0,0 +1,190 @@ +use std::collections::VecDeque; + +use parquet2::page::DictPage; +use parquet2::types::NativeType as ParquetNativeType; + +use super::super::dictionary::{nested_next_dict, *}; +use super::super::nested_utils::{InitNested, NestedState}; +use super::super::utils::MaybeNext; +use super::super::Pages; +use super::basic::deserialize_plain; +use crate::array::{Array, DictionaryArray, DictionaryKey, PrimitiveArray}; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::NativeType; + +fn read_dict(data_type: DataType, op: F, dict: &DictPage) -> Box +where + T: NativeType, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + let data_type = match data_type { + DataType::Dictionary(_, values, _) => *values, + _ => data_type, + }; + let values = deserialize_plain(&dict.buffer, op); + + Box::new(PrimitiveArray::new(data_type, values.into(), None)) +} + +/// An iterator adapter over [`Pages`] assumed to be encoded as boolean arrays +#[derive(Debug)] +pub struct DictIter +where + I: Pages, + T: NativeType, + K: DictionaryKey, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + iter: I, + data_type: DataType, + values: Option>, + items: VecDeque<(Vec, MutableBitmap)>, + remaining: usize, + chunk_size: Option, + op: F, + phantom: std::marker::PhantomData
<P>
, +} + +impl DictIter +where + K: DictionaryKey, + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + pub fn new( + iter: I, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + op: F, + ) -> Self { + Self { + iter, + data_type, + values: None, + items: VecDeque::new(), + chunk_size, + remaining: num_rows, + op, + phantom: Default::default(), + } + } +} + +impl Iterator for DictIter +where + I: Pages, + T: NativeType, + K: DictionaryKey, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = next_dict( + &mut self.iter, + &mut self.items, + &mut self.values, + self.data_type.clone(), + &mut self.remaining, + self.chunk_size, + |dict| read_dict::(self.data_type.clone(), self.op, dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} + +/// An iterator adapter that converts [`DataPages`] into an [`Iterator`] of [`DictionaryArray`] +#[derive(Debug)] +pub struct NestedDictIter +where + I: Pages, + T: NativeType, + K: DictionaryKey, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + iter: I, + init: Vec, + data_type: DataType, + values: Option>, + items: VecDeque<(NestedState, (Vec, MutableBitmap))>, + remaining: usize, + chunk_size: Option, + op: F, + phantom: std::marker::PhantomData
<P>
, +} + +impl NestedDictIter +where + K: DictionaryKey, + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + op: F, + ) -> Self { + Self { + iter, + init, + data_type, + values: None, + items: VecDeque::new(), + remaining: num_rows, + chunk_size, + op, + phantom: Default::default(), + } + } +} + +impl Iterator for NestedDictIter +where + I: Pages, + T: NativeType, + K: DictionaryKey, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type Item = Result<(NestedState, DictionaryArray)>; + + fn next(&mut self) -> Option { + let maybe_state = nested_next_dict( + &mut self.iter, + &mut self.items, + &mut self.remaining, + &self.init, + &mut self.values, + self.data_type.clone(), + self.chunk_size, + |dict| read_dict::(self.data_type.clone(), self.op, dict), + ); + match maybe_state { + MaybeNext::Some(Ok(dict)) => Some(Ok(dict)), + MaybeNext::Some(Err(e)) => Some(Err(e)), + MaybeNext::None => None, + MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/integer.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/integer.rs new file mode 100644 index 000000000000..ac6c0bac0c1f --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/integer.rs @@ -0,0 +1,262 @@ +use std::collections::VecDeque; + +use num_traits::AsPrimitive; +use parquet2::deserialize::SliceFilteredIter; +use parquet2::encoding::delta_bitpacked::Decoder; +use parquet2::encoding::Encoding; +use parquet2::page::{split_buffer, DataPage, DictPage}; +use parquet2::schema::Repetition; +use parquet2::types::NativeType as ParquetNativeType; + +use super::super::{utils, Pages}; +use super::basic::{finish, PrimitiveDecoder, State as PrimitiveState}; +use crate::array::MutablePrimitiveArray; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::io::parquet::read::deserialize::utils::{ + get_selected_rows, FilteredOptionalPageValidity, OptionalPageValidity, +}; +use crate::types::NativeType; + +/// The state of a [`DataPage`] of an integer parquet type (i32 or i64) +#[derive(Debug)] +enum State<'a, T> +where + T: NativeType, +{ + Common(PrimitiveState<'a, T>), + DeltaBinaryPackedRequired(Decoder<'a>), + DeltaBinaryPackedOptional(OptionalPageValidity<'a>, Decoder<'a>), + FilteredDeltaBinaryPackedRequired(SliceFilteredIter>), + FilteredDeltaBinaryPackedOptional(FilteredOptionalPageValidity<'a>, Decoder<'a>), +} + +impl<'a, T> utils::PageState<'a> for State<'a, T> +where + T: NativeType, +{ + fn len(&self) -> usize { + match self { + State::Common(state) => state.len(), + State::DeltaBinaryPackedRequired(state) => state.size_hint().0, + State::DeltaBinaryPackedOptional(state, _) => state.len(), + State::FilteredDeltaBinaryPackedRequired(state) => state.size_hint().0, + State::FilteredDeltaBinaryPackedOptional(state, _) => state.len(), + } + } +} + +/// Decoder of integer parquet type +#[derive(Debug)] +struct IntDecoder(PrimitiveDecoder) +where + T: NativeType, + P: ParquetNativeType, + i64: num_traits::AsPrimitive
<P>
, + F: Fn(P) -> T; + +impl IntDecoder +where + T: NativeType, + P: ParquetNativeType, + i64: num_traits::AsPrimitive
<P>
, + F: Fn(P) -> T, +{ + #[inline] + fn new(op: F) -> Self { + Self(PrimitiveDecoder::new(op)) + } +} + +impl<'a, T, P, F> utils::Decoder<'a> for IntDecoder +where + T: NativeType, + P: ParquetNativeType, + i64: num_traits::AsPrimitive
<P>
, + F: Copy + Fn(P) -> T, +{ + type State = State<'a, T>; + type Dict = Vec; + type DecodedState = (Vec, MutableBitmap); + + fn build_state(&self, page: &'a DataPage, dict: Option<&'a Self::Dict>) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::DeltaBinaryPacked, _, false, false) => { + let (_, _, values) = split_buffer(page)?; + Decoder::try_new(values) + .map(State::DeltaBinaryPackedRequired) + .map_err(Error::from) + }, + (Encoding::DeltaBinaryPacked, _, true, false) => { + let (_, _, values) = split_buffer(page)?; + Ok(State::DeltaBinaryPackedOptional( + OptionalPageValidity::try_new(page)?, + Decoder::try_new(values)?, + )) + }, + (Encoding::DeltaBinaryPacked, _, false, true) => { + let (_, _, values) = split_buffer(page)?; + let values = Decoder::try_new(values)?; + + let rows = get_selected_rows(page); + let values = SliceFilteredIter::new(values, rows); + + Ok(State::FilteredDeltaBinaryPackedRequired(values)) + }, + (Encoding::DeltaBinaryPacked, _, true, true) => { + let (_, _, values) = split_buffer(page)?; + let values = Decoder::try_new(values)?; + + Ok(State::FilteredDeltaBinaryPackedOptional( + FilteredOptionalPageValidity::try_new(page)?, + values, + )) + }, + _ => self.0.build_state(page, dict).map(State::Common), + } + } + + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + self.0.with_capacity(capacity) + } + + fn extend_from_state( + &self, + state: &mut Self::State, + decoded: &mut Self::DecodedState, + remaining: usize, + ) { + let (values, validity) = decoded; + match state { + State::Common(state) => self.0.extend_from_state(state, decoded, remaining), + State::DeltaBinaryPackedRequired(state) => { + values.extend( + state + .by_ref() + .map(|x| x.unwrap().as_()) + .map(self.0.op) + .take(remaining), + ); + }, + State::DeltaBinaryPackedOptional(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values + .by_ref() + .map(|x| x.unwrap().as_()) + .map(self.0.op), + ) + }, + State::FilteredDeltaBinaryPackedRequired(page) => { + values.extend( + page.by_ref() + .map(|x| x.unwrap().as_()) + .map(self.0.op) + .take(remaining), + ); + }, + State::FilteredDeltaBinaryPackedOptional(page_validity, page_values) => { + utils::extend_from_decoder( + validity, + page_validity, + Some(remaining), + values, + page_values + .by_ref() + .map(|x| x.unwrap().as_()) + .map(self.0.op), + ); + }, + } + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dict { + self.0.deserialize_dict(page) + } +} + +/// An [`Iterator`] adapter over [`Pages`] assumed to be encoded as primitive arrays +/// encoded as parquet integer types +#[derive(Debug)] +pub struct IntegerIter +where + I: Pages, + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + iter: I, + data_type: DataType, + items: VecDeque<(Vec, MutableBitmap)>, + remaining: usize, + chunk_size: Option, + dict: Option>, + op: F, + phantom: std::marker::PhantomData
<P>
, +} + +impl IntegerIter +where + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + pub fn new( + iter: I, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + op: F, + ) -> Self { + Self { + iter, + data_type, + items: VecDeque::new(), + dict: None, + remaining: num_rows, + chunk_size, + op, + phantom: Default::default(), + } + } +} + +impl Iterator for IntegerIter +where + I: Pages, + T: NativeType, + P: ParquetNativeType, + i64: num_traits::AsPrimitive
<P>
, + F: Copy + Fn(P) -> T, +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let maybe_state = utils::next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + self.chunk_size, + &IntDecoder::new(self.op), + ); + match maybe_state { + utils::MaybeNext::Some(Ok((values, validity))) => { + Some(Ok(finish(&self.data_type, values, validity))) + }, + utils::MaybeNext::Some(Err(e)) => Some(Err(e)), + utils::MaybeNext::None => None, + utils::MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/mod.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/mod.rs new file mode 100644 index 000000000000..27d9c27c3186 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/mod.rs @@ -0,0 +1,9 @@ +mod basic; +mod dictionary; +mod integer; +mod nested; + +pub use basic::Iter; +pub use dictionary::{DictIter, NestedDictIter}; +pub use integer::IntegerIter; +pub use nested::NestedIter; diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/nested.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/nested.rs new file mode 100644 index 000000000000..405e2d9a7c09 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/primitive/nested.rs @@ -0,0 +1,244 @@ +use std::collections::VecDeque; + +use parquet2::encoding::Encoding; +use parquet2::page::{DataPage, DictPage}; +use parquet2::schema::Repetition; +use parquet2::types::{decode, NativeType as ParquetNativeType}; + +use super::super::nested_utils::*; +use super::super::{utils, Pages}; +use super::basic::{deserialize_plain, Values, ValuesDictionary}; +use crate::array::PrimitiveArray; +use crate::bitmap::MutableBitmap; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::types::NativeType; + +// The state of a `DataPage` of `Primitive` parquet primitive type +#[allow(clippy::large_enum_variant)] +#[derive(Debug)] +enum State<'a, T> +where + T: NativeType, +{ + Optional(Values<'a>), + Required(Values<'a>), + RequiredDictionary(ValuesDictionary<'a, T>), + OptionalDictionary(ValuesDictionary<'a, T>), +} + +impl<'a, T> utils::PageState<'a> for State<'a, T> +where + T: NativeType, +{ + fn len(&self) -> usize { + match self { + State::Optional(values) => values.len(), + State::Required(values) => values.len(), + State::RequiredDictionary(values) => values.len(), + State::OptionalDictionary(values) => values.len(), + } + } +} + +#[derive(Debug)] +struct PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + phantom: std::marker::PhantomData, + phantom_p: std::marker::PhantomData
<P>
, + op: F, +} + +impl PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Fn(P) -> T, +{ + #[inline] + fn new(op: F) -> Self { + Self { + phantom: std::marker::PhantomData, + phantom_p: std::marker::PhantomData, + op, + } + } +} + +impl<'a, T, P, F> NestedDecoder<'a> for PrimitiveDecoder +where + T: NativeType, + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type State = State<'a, T>; + type Dictionary = Vec; + type DecodedState = (Vec, MutableBitmap); + + fn build_state( + &self, + page: &'a DataPage, + dict: Option<&'a Self::Dictionary>, + ) -> Result { + let is_optional = + page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + + match (page.encoding(), dict, is_optional, is_filtered) { + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), false, false) => { + ValuesDictionary::try_new(page, dict).map(State::RequiredDictionary) + }, + (Encoding::PlainDictionary | Encoding::RleDictionary, Some(dict), true, false) => { + ValuesDictionary::try_new(page, dict).map(State::OptionalDictionary) + }, + (Encoding::Plain, _, true, false) => Values::try_new::
<P>
(page).map(State::Optional), + (Encoding::Plain, _, false, false) => Values::try_new::
<P>
(page).map(State::Required), + _ => Err(utils::not_implemented(page)), + } + } + + /// Initializes a new state + fn with_capacity(&self, capacity: usize) -> Self::DecodedState { + ( + Vec::::with_capacity(capacity), + MutableBitmap::with_capacity(capacity), + ) + } + + fn push_valid(&self, state: &mut Self::State, decoded: &mut Self::DecodedState) -> Result<()> { + let (values, validity) = decoded; + match state { + State::Optional(page_values) => { + let value = page_values.values.by_ref().next().map(decode).map(self.op); + // convert unwrap to error + values.push(value.unwrap_or_default()); + validity.push(true); + }, + State::Required(page_values) => { + let value = page_values.values.by_ref().next().map(decode).map(self.op); + // convert unwrap to error + values.push(value.unwrap_or_default()); + }, + State::RequiredDictionary(page) => { + let value = page + .values + .next() + .map(|index| page.dict[index.unwrap() as usize]); + + values.push(value.unwrap_or_default()); + }, + State::OptionalDictionary(page) => { + let value = page + .values + .next() + .map(|index| page.dict[index.unwrap() as usize]); + + values.push(value.unwrap_or_default()); + validity.push(true); + }, + } + Ok(()) + } + + fn push_null(&self, decoded: &mut Self::DecodedState) { + let (values, validity) = decoded; + values.push(T::default()); + validity.push(false) + } + + fn deserialize_dict(&self, page: &DictPage) -> Self::Dictionary { + deserialize_plain(&page.buffer, self.op) + } +} + +fn finish( + data_type: &DataType, + values: Vec, + validity: MutableBitmap, +) -> PrimitiveArray { + PrimitiveArray::new(data_type.clone(), values.into(), validity.into()) +} + +/// An iterator adapter over [`Pages`] assumed to be encoded as boolean arrays +#[derive(Debug)] +pub struct NestedIter +where + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + iter: I, + init: Vec, + data_type: DataType, + items: VecDeque<(NestedState, (Vec, MutableBitmap))>, + dict: Option>, + remaining: usize, + chunk_size: Option, + decoder: PrimitiveDecoder, +} + +impl NestedIter +where + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + pub fn new( + iter: I, + init: Vec, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + op: F, + ) -> Self { + Self { + iter, + init, + data_type, + items: VecDeque::new(), + dict: None, + chunk_size, + remaining: num_rows, + decoder: PrimitiveDecoder::new(op), + } + } +} + +impl Iterator for NestedIter +where + I: Pages, + T: NativeType, + + P: ParquetNativeType, + F: Copy + Fn(P) -> T, +{ + type Item = Result<(NestedState, PrimitiveArray)>; + + fn next(&mut self) -> Option { + let maybe_state = next( + &mut self.iter, + &mut self.items, + &mut self.dict, + &mut self.remaining, + &self.init, + self.chunk_size, + &self.decoder, + ); + match maybe_state { + utils::MaybeNext::Some(Ok((nested, state))) => { + Some(Ok((nested, finish(&self.data_type, state.0, state.1)))) + }, + utils::MaybeNext::Some(Err(e)) => Some(Err(e)), + utils::MaybeNext::None => None, + utils::MaybeNext::More => self.next(), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/simple.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/simple.rs new file mode 100644 index 000000000000..83d9d8fbae8a --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/simple.rs @@ -0,0 +1,651 @@ +use ethnum::I256; +use parquet2::schema::types::{ + PhysicalType, PrimitiveLogicalType, PrimitiveType, TimeUnit as ParquetTimeUnit, +}; +use 
parquet2::types::int96_to_i64_ns; + +use super::super::{ArrayIter, Pages}; +use super::{binary, boolean, fixed_size_binary, null, primitive}; +use crate::array::{Array, DictionaryKey, MutablePrimitiveArray, PrimitiveArray}; +use crate::datatypes::{DataType, IntervalUnit, TimeUnit}; +use crate::error::{Error, Result}; +use crate::types::{days_ms, i256, NativeType}; + +/// Converts an iterator of arrays to a trait object returning trait objects +#[inline] +fn dyn_iter<'a, A, I>(iter: I) -> ArrayIter<'a> +where + A: Array, + I: Iterator> + Send + Sync + 'a, +{ + Box::new(iter.map(|x| x.map(|x| Box::new(x) as Box))) +} + +/// Converts an iterator of [MutablePrimitiveArray] into an iterator of [PrimitiveArray] +#[inline] +fn iden(iter: I) -> impl Iterator>> +where + T: NativeType, + I: Iterator>>, +{ + iter.map(|x| x.map(|x| x.into())) +} + +#[inline] +fn op(iter: I, op: F) -> impl Iterator>> +where + T: NativeType, + I: Iterator>>, + F: Fn(T) -> T + Copy, +{ + iter.map(move |x| { + x.map(move |mut x| { + x.values_mut_slice().iter_mut().for_each(|x| *x = op(*x)); + x.into() + }) + }) +} + +/// An iterator adapter that maps an iterator of Pages into an iterator of Arrays +/// of [`DataType`] `data_type` and length `chunk_size`. +pub fn page_iter_to_arrays<'a, I: Pages + 'a>( + pages: I, + type_: &PrimitiveType, + data_type: DataType, + chunk_size: Option, + num_rows: usize, +) -> Result> { + use DataType::*; + + let physical_type = &type_.physical_type; + let logical_type = &type_.logical_type; + + Ok(match (physical_type, data_type.to_logical_type()) { + (_, Null) => null::iter_to_arrays(pages, data_type, chunk_size, num_rows), + (PhysicalType::Boolean, Boolean) => { + dyn_iter(boolean::Iter::new(pages, data_type, chunk_size, num_rows)) + }, + (PhysicalType::Int32, UInt8) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as u8, + ))), + (PhysicalType::Int32, UInt16) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as u16, + ))), + (PhysicalType::Int32, UInt32) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as u32, + ))), + (PhysicalType::Int64, UInt32) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i64| x as u32, + ))), + (PhysicalType::Int32, Int8) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as i8, + ))), + (PhysicalType::Int32, Int16) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as i16, + ))), + (PhysicalType::Int32, Int32 | Date32 | Time32(_)) => dyn_iter(iden( + primitive::IntegerIter::new(pages, data_type, num_rows, chunk_size, |x: i32| x), + )), + (PhysicalType::Int64 | PhysicalType::Int96, Timestamp(time_unit, _)) => { + let time_unit = *time_unit; + return timestamp( + pages, + physical_type, + logical_type, + data_type, + num_rows, + chunk_size, + time_unit, + ); + }, + (PhysicalType::FixedLenByteArray(_), FixedSizeBinary(_)) => dyn_iter( + fixed_size_binary::Iter::new(pages, data_type, num_rows, chunk_size), + ), + (PhysicalType::FixedLenByteArray(12), Interval(IntervalUnit::YearMonth)) => { + let n = 12; + let pages = fixed_size_binary::Iter::new( + pages, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + + let pages = pages.map(move |maybe_array| { + let array = maybe_array?; + let values = array + .values() + 
.chunks_exact(n) + .map(|value: &[u8]| i32::from_le_bytes(value[..4].try_into().unwrap())) + .collect::>(); + let validity = array.validity().cloned(); + + PrimitiveArray::::try_new(data_type.clone(), values.into(), validity) + }); + + let arrays = pages.map(|x| x.map(|x| x.boxed())); + + Box::new(arrays) as _ + }, + (PhysicalType::FixedLenByteArray(12), Interval(IntervalUnit::DayTime)) => { + let n = 12; + let pages = fixed_size_binary::Iter::new( + pages, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + + let pages = pages.map(move |maybe_array| { + let array = maybe_array?; + let values = array + .values() + .chunks_exact(n) + .map(super::super::convert_days_ms) + .collect::>(); + let validity = array.validity().cloned(); + + PrimitiveArray::::try_new(data_type.clone(), values.into(), validity) + }); + + let arrays = pages.map(|x| x.map(|x| x.boxed())); + + Box::new(arrays) as _ + }, + (PhysicalType::Int32, Decimal(_, _)) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as i128, + ))), + (PhysicalType::Int64, Decimal(_, _)) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i64| x as i128, + ))), + (PhysicalType::FixedLenByteArray(n), Decimal(_, _)) if *n > 16 => { + return Err(Error::NotYetImplemented(format!( + "Can't decode Decimal128 type from Fixed Size Byte Array of len {n:?}" + ))) + }, + (PhysicalType::FixedLenByteArray(n), Decimal(_, _)) => { + let n = *n; + + let pages = fixed_size_binary::Iter::new( + pages, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + + let pages = pages.map(move |maybe_array| { + let array = maybe_array?; + let values = array + .values() + .chunks_exact(n) + .map(|value: &[u8]| super::super::convert_i128(value, n)) + .collect::>(); + let validity = array.validity().cloned(); + + PrimitiveArray::::try_new(data_type.clone(), values.into(), validity) + }); + + let arrays = pages.map(|x| x.map(|x| x.boxed())); + + Box::new(arrays) as _ + }, + (PhysicalType::Int32, Decimal256(_, _)) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| i256(I256::new(x as i128)), + ))), + (PhysicalType::Int64, Decimal256(_, _)) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i64| i256(I256::new(x as i128)), + ))), + (PhysicalType::FixedLenByteArray(n), Decimal256(_, _)) if *n <= 16 => { + let n = *n; + + let pages = fixed_size_binary::Iter::new( + pages, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + + let pages = pages.map(move |maybe_array| { + let array = maybe_array?; + let values = array + .values() + .chunks_exact(n) + .map(|value: &[u8]| i256(I256::new(super::super::convert_i128(value, n)))) + .collect::>(); + let validity = array.validity().cloned(); + + PrimitiveArray::::try_new(data_type.clone(), values.into(), validity) + }); + + let arrays = pages.map(|x| x.map(|x| x.boxed())); + + Box::new(arrays) as _ + }, + (PhysicalType::FixedLenByteArray(n), Decimal256(_, _)) if *n <= 32 => { + let n = *n; + + let pages = fixed_size_binary::Iter::new( + pages, + DataType::FixedSizeBinary(n), + num_rows, + chunk_size, + ); + + let pages = pages.map(move |maybe_array| { + let array = maybe_array?; + let values = array + .values() + .chunks_exact(n) + .map(super::super::convert_i256) + .collect::>(); + let validity = array.validity().cloned(); + + PrimitiveArray::::try_new(data_type.clone(), values.into(), validity) + }); 
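// Note on the conversion above: a parquet decimal stored in a FIXED_LEN_BYTE_ARRAY
// holds the unscaled value as an `n`-byte big-endian two's-complement integer;
// `convert_i256` (from the parent module) sign-extends each `n`-byte chunk to the
// 32-byte `i256` that backs the resulting `Decimal256` primitive array.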
+ + let arrays = pages.map(|x| x.map(|x| x.boxed())); + + Box::new(arrays) as _ + }, + (PhysicalType::FixedLenByteArray(n), Decimal256(_, _)) if *n > 32 => { + return Err(Error::NotYetImplemented(format!( + "Can't decode Decimal256 type from Fixed Size Byte Array of len {n:?}" + ))) + }, + (PhysicalType::Int32, Date64) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i32| x as i64 * 86400000, + ))), + (PhysicalType::Int64, Date64) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i64| x, + ))), + (PhysicalType::Int64, Int64 | Time64(_) | Duration(_)) => dyn_iter(iden( + primitive::IntegerIter::new(pages, data_type, num_rows, chunk_size, |x: i64| x), + )), + (PhysicalType::Int64, UInt64) => dyn_iter(iden(primitive::IntegerIter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: i64| x as u64, + ))), + (PhysicalType::Float, Float32) => dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: f32| x, + ))), + (PhysicalType::Double, Float64) => dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + |x: f64| x, + ))), + + (PhysicalType::ByteArray, Utf8 | Binary) => Box::new(binary::Iter::::new( + pages, data_type, chunk_size, num_rows, + )), + (PhysicalType::ByteArray, LargeBinary | LargeUtf8) => Box::new( + binary::Iter::::new(pages, data_type, chunk_size, num_rows), + ), + + (_, Dictionary(key_type, _, _)) => { + return match_integer_type!(key_type, |$K| { + dict_read::<$K, _>(pages, physical_type, logical_type, data_type, num_rows, chunk_size) + }) + }, + (from, to) => { + return Err(Error::NotYetImplemented(format!( + "Reading parquet type {from:?} to {to:?} still not implemented" + ))) + }, + }) +} + +/// Unify the timestamp unit from parquet TimeUnit into arrow's TimeUnit +/// Returns (a int64 factor, is_multiplier) +fn unify_timestamp_unit( + logical_type: &Option, + time_unit: TimeUnit, +) -> (i64, bool) { + if let Some(PrimitiveLogicalType::Timestamp { unit, .. 
}) = logical_type { + match (*unit, time_unit) { + (ParquetTimeUnit::Milliseconds, TimeUnit::Millisecond) + | (ParquetTimeUnit::Microseconds, TimeUnit::Microsecond) + | (ParquetTimeUnit::Nanoseconds, TimeUnit::Nanosecond) => (1, true), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Second) + | (ParquetTimeUnit::Microseconds, TimeUnit::Millisecond) + | (ParquetTimeUnit::Nanoseconds, TimeUnit::Microsecond) => (1000, false), + + (ParquetTimeUnit::Microseconds, TimeUnit::Second) + | (ParquetTimeUnit::Nanoseconds, TimeUnit::Millisecond) => (1_000_000, false), + + (ParquetTimeUnit::Nanoseconds, TimeUnit::Second) => (1_000_000_000, false), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Microsecond) + | (ParquetTimeUnit::Microseconds, TimeUnit::Nanosecond) => (1_000, true), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Nanosecond) => (1_000_000, true), + } + } else { + (1, true) + } +} + +#[inline] +pub fn int96_to_i64_us(value: [u32; 3]) -> i64 { + const JULIAN_DAY_OF_EPOCH: i64 = 2_440_588; + const SECONDS_PER_DAY: i64 = 86_400; + const MICROS_PER_SECOND: i64 = 1_000_000; + + let day = value[2] as i64; + let microseconds = (((value[1] as i64) << 32) + value[0] as i64) / 1_000; + let seconds = (day - JULIAN_DAY_OF_EPOCH) * SECONDS_PER_DAY; + + seconds * MICROS_PER_SECOND + microseconds +} + +#[inline] +pub fn int96_to_i64_ms(value: [u32; 3]) -> i64 { + const JULIAN_DAY_OF_EPOCH: i64 = 2_440_588; + const SECONDS_PER_DAY: i64 = 86_400; + const MILLIS_PER_SECOND: i64 = 1_000; + + let day = value[2] as i64; + let milliseconds = (((value[1] as i64) << 32) + value[0] as i64) / 1_000_000; + let seconds = (day - JULIAN_DAY_OF_EPOCH) * SECONDS_PER_DAY; + + seconds * MILLIS_PER_SECOND + milliseconds +} + +#[inline] +pub fn int96_to_i64_s(value: [u32; 3]) -> i64 { + const JULIAN_DAY_OF_EPOCH: i64 = 2_440_588; + const SECONDS_PER_DAY: i64 = 86_400; + + let day = value[2] as i64; + let seconds = (((value[1] as i64) << 32) + value[0] as i64) / 1_000_000_000; + let day_seconds = (day - JULIAN_DAY_OF_EPOCH) * SECONDS_PER_DAY; + + day_seconds + seconds +} + +fn timestamp<'a, I: Pages + 'a>( + pages: I, + physical_type: &PhysicalType, + logical_type: &Option, + data_type: DataType, + num_rows: usize, + chunk_size: Option, + time_unit: TimeUnit, +) -> Result> { + if physical_type == &PhysicalType::Int96 { + return match time_unit { + TimeUnit::Nanosecond => Ok(dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + int96_to_i64_ns, + )))), + TimeUnit::Microsecond => Ok(dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + int96_to_i64_us, + )))), + TimeUnit::Millisecond => Ok(dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + int96_to_i64_ms, + )))), + TimeUnit::Second => Ok(dyn_iter(iden(primitive::Iter::new( + pages, + data_type, + num_rows, + chunk_size, + int96_to_i64_s, + )))), + }; + }; + + if physical_type != &PhysicalType::Int64 { + return Err(Error::nyi( + "Can't decode a timestamp from a non-int64 parquet type", + )); + } + + let iter = primitive::IntegerIter::new(pages, data_type, num_rows, chunk_size, |x: i64| x); + let (factor, is_multiplier) = unify_timestamp_unit(logical_type, time_unit); + match (factor, is_multiplier) { + (1, _) => Ok(dyn_iter(iden(iter))), + (a, true) => Ok(dyn_iter(op(iter, move |x| x * a))), + (a, false) => Ok(dyn_iter(op(iter, move |x| x / a))), + } +} + +fn timestamp_dict<'a, K: DictionaryKey, I: Pages + 'a>( + pages: I, + physical_type: &PhysicalType, + logical_type: &Option, + 
data_type: DataType, + num_rows: usize, + chunk_size: Option, + time_unit: TimeUnit, +) -> Result> { + if physical_type == &PhysicalType::Int96 { + let logical_type = PrimitiveLogicalType::Timestamp { + unit: ParquetTimeUnit::Nanoseconds, + is_adjusted_to_utc: false, + }; + let (factor, is_multiplier) = unify_timestamp_unit(&Some(logical_type), time_unit); + return match (factor, is_multiplier) { + (a, true) => Ok(dyn_iter(primitive::DictIter::::new( + pages, + DataType::Timestamp(TimeUnit::Nanosecond, None), + num_rows, + chunk_size, + move |x| int96_to_i64_ns(x) * a, + ))), + (a, false) => Ok(dyn_iter(primitive::DictIter::::new( + pages, + DataType::Timestamp(TimeUnit::Nanosecond, None), + num_rows, + chunk_size, + move |x| int96_to_i64_ns(x) / a, + ))), + }; + }; + + let (factor, is_multiplier) = unify_timestamp_unit(logical_type, time_unit); + match (factor, is_multiplier) { + (a, true) => Ok(dyn_iter(primitive::DictIter::::new( + pages, + data_type, + num_rows, + chunk_size, + move |x: i64| x * a, + ))), + (a, false) => Ok(dyn_iter(primitive::DictIter::::new( + pages, + data_type, + num_rows, + chunk_size, + move |x: i64| x / a, + ))), + } +} + +fn dict_read<'a, K: DictionaryKey, I: Pages + 'a>( + iter: I, + physical_type: &PhysicalType, + logical_type: &Option, + data_type: DataType, + num_rows: usize, + chunk_size: Option, +) -> Result> { + use DataType::*; + let values_data_type = if let Dictionary(_, v, _) = &data_type { + v.as_ref() + } else { + panic!() + }; + + Ok(match (physical_type, values_data_type.to_logical_type()) { + (PhysicalType::Int32, UInt8) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x as u8, + )), + (PhysicalType::Int32, UInt16) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x as u16, + )), + (PhysicalType::Int32, UInt32) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x as u32, + )), + (PhysicalType::Int64, UInt64) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i64| x as u64, + )), + (PhysicalType::Int32, Int8) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x as i8, + )), + (PhysicalType::Int32, Int16) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x as i16, + )), + (PhysicalType::Int32, Int32 | Date32 | Time32(_) | Interval(IntervalUnit::YearMonth)) => { + dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i32| x, + )) + }, + + (PhysicalType::Int64, Timestamp(time_unit, _)) => { + let time_unit = *time_unit; + return timestamp_dict::( + iter, + physical_type, + logical_type, + data_type, + num_rows, + chunk_size, + time_unit, + ); + }, + + (PhysicalType::Int64, Int64 | Date64 | Time64(_) | Duration(_)) => { + dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: i64| x, + )) + }, + (PhysicalType::Float, Float32) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: f32| x, + )), + (PhysicalType::Double, Float64) => dyn_iter(primitive::DictIter::::new( + iter, + data_type, + num_rows, + chunk_size, + |x: f64| x, + )), + + (PhysicalType::ByteArray, Utf8 | Binary) => dyn_iter(binary::DictIter::::new( + iter, data_type, num_rows, chunk_size, + )), + (PhysicalType::ByteArray, LargeUtf8 | LargeBinary) => dyn_iter( + binary::DictIter::::new(iter, data_type, 
num_rows, chunk_size), + ), + (PhysicalType::FixedLenByteArray(_), FixedSizeBinary(_)) => dyn_iter( + fixed_size_binary::DictIter::::new(iter, data_type, num_rows, chunk_size), + ), + other => { + return Err(Error::nyi(format!( + "Reading dictionaries of type {other:?}" + ))) + }, + }) +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/struct_.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/struct_.rs new file mode 100644 index 000000000000..947e7f1141e5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/struct_.rs @@ -0,0 +1,58 @@ +use super::nested_utils::{NestedArrayIter, NestedState}; +use crate::array::{Array, StructArray}; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; + +/// An iterator adapter over [`NestedArrayIter`] assumed to be encoded as Struct arrays +pub struct StructIterator<'a> { + iters: Vec>, + fields: Vec, +} + +impl<'a> StructIterator<'a> { + /// Creates a new [`StructIterator`] with `iters` and `fields`. + pub fn new(iters: Vec>, fields: Vec) -> Self { + assert_eq!(iters.len(), fields.len()); + Self { iters, fields } + } +} + +impl<'a> Iterator for StructIterator<'a> { + type Item = Result<(NestedState, Box), Error>; + + fn next(&mut self) -> Option { + let values = self + .iters + .iter_mut() + .map(|iter| iter.next()) + .collect::>(); + + if values.iter().any(|x| x.is_none()) { + return None; + } + + // todo: unzip of Result not yet supported in stable Rust + let mut nested = vec![]; + let mut new_values = vec![]; + for x in values { + match x.unwrap() { + Ok((nest, values)) => { + new_values.push(values); + nested.push(nest); + }, + Err(e) => return Some(Err(e)), + } + } + let mut nested = nested.pop().unwrap(); + let (_, validity) = nested.nested.pop().unwrap().inner(); + + Some(Ok(( + nested, + Box::new(StructArray::new( + DataType::Struct(self.fields.clone()), + new_values, + validity.and_then(|x| x.into()), + )), + ))) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/deserialize/utils.rs b/crates/nano-arrow/src/io/parquet/read/deserialize/utils.rs new file mode 100644 index 000000000000..a39a7506d8e1 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/deserialize/utils.rs @@ -0,0 +1,524 @@ +use std::collections::VecDeque; + +use parquet2::deserialize::{ + FilteredHybridEncoded, FilteredHybridRleDecoderIter, HybridDecoderBitmapIter, HybridEncoded, +}; +use parquet2::encoding::hybrid_rle; +use parquet2::indexes::Interval; +use parquet2::page::{split_buffer, DataPage, DictPage, Page}; +use parquet2::schema::Repetition; + +use super::super::Pages; +use crate::bitmap::utils::BitmapIter; +use crate::bitmap::MutableBitmap; +use crate::error::Error; + +pub fn not_implemented(page: &DataPage) -> Error { + let is_optional = page.descriptor.primitive_type.field_info.repetition == Repetition::Optional; + let is_filtered = page.selected_rows().is_some(); + let required = if is_optional { "optional" } else { "required" }; + let is_filtered = if is_filtered { ", index-filtered" } else { "" }; + Error::NotYetImplemented(format!( + "Decoding {:?} \"{:?}\"-encoded {} {} parquet pages", + page.descriptor.primitive_type.physical_type, + page.encoding(), + required, + is_filtered, + )) +} + +/// A private trait representing structs that can receive elements. 
+pub(super) trait Pushable: Sized { + fn reserve(&mut self, additional: usize); + fn push(&mut self, value: T); + fn len(&self) -> usize; + fn push_null(&mut self); + fn extend_constant(&mut self, additional: usize, value: T); +} + +impl Pushable for MutableBitmap { + #[inline] + fn reserve(&mut self, additional: usize) { + MutableBitmap::reserve(self, additional) + } + #[inline] + fn len(&self) -> usize { + self.len() + } + + #[inline] + fn push(&mut self, value: bool) { + self.push(value) + } + + #[inline] + fn push_null(&mut self) { + self.push(false) + } + + #[inline] + fn extend_constant(&mut self, additional: usize, value: bool) { + self.extend_constant(additional, value) + } +} + +impl Pushable for Vec { + #[inline] + fn reserve(&mut self, additional: usize) { + Vec::reserve(self, additional) + } + #[inline] + fn len(&self) -> usize { + self.len() + } + + #[inline] + fn push_null(&mut self) { + self.push(A::default()) + } + + #[inline] + fn push(&mut self, value: A) { + self.push(value) + } + + #[inline] + fn extend_constant(&mut self, additional: usize, value: A) { + self.resize(self.len() + additional, value); + } +} + +/// The state of a partially deserialized page +pub(super) trait PageValidity<'a> { + fn next_limited(&mut self, limit: usize) -> Option>; +} + +#[derive(Debug, Clone)] +pub struct FilteredOptionalPageValidity<'a> { + iter: FilteredHybridRleDecoderIter<'a>, + current: Option<(FilteredHybridEncoded<'a>, usize)>, +} + +impl<'a> FilteredOptionalPageValidity<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, validity, _) = split_buffer(page)?; + + let iter = hybrid_rle::Decoder::new(validity, 1); + let iter = HybridDecoderBitmapIter::new(iter, page.num_values()); + let selected_rows = get_selected_rows(page); + let iter = FilteredHybridRleDecoderIter::new(iter, selected_rows); + + Ok(Self { + iter, + current: None, + }) + } + + pub fn len(&self) -> usize { + self.iter.len() + } +} + +pub fn get_selected_rows(page: &DataPage) -> VecDeque { + page.selected_rows() + .unwrap_or(&[Interval::new(0, page.num_values())]) + .iter() + .copied() + .collect() +} + +impl<'a> PageValidity<'a> for FilteredOptionalPageValidity<'a> { + fn next_limited(&mut self, limit: usize) -> Option> { + let (run, own_offset) = if let Some((run, offset)) = self.current { + (run, offset) + } else { + // a new run + let run = self.iter.next()?.unwrap(); // no run -> None + self.current = Some((run, 0)); + return self.next_limited(limit); + }; + + match run { + FilteredHybridEncoded::Bitmap { + values, + offset, + length, + } => { + let run_length = length - own_offset; + + let length = limit.min(run_length); + + if length == run_length { + self.current = None; + } else { + self.current = Some((run, own_offset + length)); + } + + Some(FilteredHybridEncoded::Bitmap { + values, + offset, + length, + }) + }, + FilteredHybridEncoded::Repeated { is_set, length } => { + let run_length = length - own_offset; + + let length = limit.min(run_length); + + if length == run_length { + self.current = None; + } else { + self.current = Some((run, own_offset + length)); + } + + Some(FilteredHybridEncoded::Repeated { is_set, length }) + }, + FilteredHybridEncoded::Skipped(set) => { + self.current = None; + Some(FilteredHybridEncoded::Skipped(set)) + }, + } + } +} + +pub struct Zip { + validity: V, + values: I, +} + +impl Zip { + pub fn new(validity: V, values: I) -> Self { + Self { validity, values } + } +} + +impl, I: Iterator> Iterator for Zip { + type Item = Option; + + #[inline] + fn next(&mut self) -> 
Option { + self.validity + .next() + .map(|x| if x { self.values.next() } else { None }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + self.validity.size_hint() + } +} + +#[derive(Debug, Clone)] +pub struct OptionalPageValidity<'a> { + iter: HybridDecoderBitmapIter<'a>, + current: Option<(HybridEncoded<'a>, usize)>, +} + +impl<'a> OptionalPageValidity<'a> { + pub fn try_new(page: &'a DataPage) -> Result { + let (_, validity, _) = split_buffer(page)?; + + let iter = hybrid_rle::Decoder::new(validity, 1); + let iter = HybridDecoderBitmapIter::new(iter, page.num_values()); + Ok(Self { + iter, + current: None, + }) + } + + /// Number of items remaining + pub fn len(&self) -> usize { + self.iter.len() + + self + .current + .as_ref() + .map(|(run, offset)| run.len() - offset) + .unwrap_or_default() + } + + fn next_limited(&mut self, limit: usize) -> Option> { + let (run, offset) = if let Some((run, offset)) = self.current { + (run, offset) + } else { + // a new run + let run = self.iter.next()?.unwrap(); // no run -> None + self.current = Some((run, 0)); + return self.next_limited(limit); + }; + + match run { + HybridEncoded::Bitmap(values, length) => { + let run_length = length - offset; + + let length = limit.min(run_length); + + if length == run_length { + self.current = None; + } else { + self.current = Some((run, offset + length)); + } + + Some(FilteredHybridEncoded::Bitmap { + values, + offset, + length, + }) + }, + HybridEncoded::Repeated(is_set, run_length) => { + let run_length = run_length - offset; + + let length = limit.min(run_length); + + if length == run_length { + self.current = None; + } else { + self.current = Some((run, offset + length)); + } + + Some(FilteredHybridEncoded::Repeated { is_set, length }) + }, + } + } +} + +impl<'a> PageValidity<'a> for OptionalPageValidity<'a> { + fn next_limited(&mut self, limit: usize) -> Option> { + self.next_limited(limit) + } +} + +/// Extends a [`Pushable`] from an iterator of non-null values and an hybrid-rle decoder +pub(super) fn extend_from_decoder, I: Iterator>( + validity: &mut MutableBitmap, + page_validity: &mut dyn PageValidity, + limit: Option, + pushable: &mut P, + mut values_iter: I, +) { + let limit = limit.unwrap_or(usize::MAX); + + let mut runs = vec![]; + let mut remaining = limit; + let mut reserve_pushable = 0; + + // first do a scan so that we know how much to reserve up front + while remaining > 0 { + let run = page_validity.next_limited(remaining); + let run = if let Some(run) = run { run } else { break }; + + match run { + FilteredHybridEncoded::Bitmap { length, .. } => { + reserve_pushable += length; + remaining -= length; + }, + FilteredHybridEncoded::Repeated { length, .. 
} => { + reserve_pushable += length; + remaining -= length; + }, + _ => {}, + }; + runs.push(run) + } + pushable.reserve(reserve_pushable); + validity.reserve(reserve_pushable); + + // then a second loop to really fill the buffers + for run in runs { + match run { + FilteredHybridEncoded::Bitmap { + values, + offset, + length, + } => { + // consume `length` items + let iter = BitmapIter::new(values, offset, length); + let iter = Zip::new(iter, &mut values_iter); + + for item in iter { + if let Some(item) = item { + pushable.push(item) + } else { + pushable.push_null() + } + } + validity.extend_from_slice(values, offset, length); + }, + FilteredHybridEncoded::Repeated { is_set, length } => { + validity.extend_constant(length, is_set); + if is_set { + for v in (&mut values_iter).take(length) { + pushable.push(v) + } + } else { + pushable.extend_constant(length, T::default()); + } + }, + FilteredHybridEncoded::Skipped(valids) => for _ in values_iter.by_ref().take(valids) {}, + }; + } +} + +/// The state of a partially deserialized page +pub(super) trait PageState<'a>: std::fmt::Debug { + fn len(&self) -> usize; +} + +/// The state of a partially deserialized page +pub(super) trait DecodedState: std::fmt::Debug { + // the number of values that the state already has + fn len(&self) -> usize; +} + +/// A decoder that knows how to map `State` -> Array +pub(super) trait Decoder<'a> { + /// The state that this decoder derives from a [`DataPage`]. This is bound to the page. + type State: PageState<'a>; + /// The dictionary representation that the decoder uses + type Dict; + /// The target state that this Decoder decodes into. + type DecodedState: DecodedState; + + /// Creates a new `Self::State` + fn build_state( + &self, + page: &'a DataPage, + dict: Option<&'a Self::Dict>, + ) -> Result; + + /// Initializes a new [`Self::DecodedState`]. + fn with_capacity(&self, capacity: usize) -> Self::DecodedState; + + /// extends [`Self::DecodedState`] by deserializing items in [`Self::State`]. + /// It guarantees that the length of `decoded` is at most `decoded.len() + remaining`. + fn extend_from_state( + &self, + page: &mut Self::State, + decoded: &mut Self::DecodedState, + additional: usize, + ); + + /// Deserializes a [`DictPage`] into [`Self::Dict`]. + fn deserialize_dict(&self, page: &DictPage) -> Self::Dict; +} + +pub(super) fn extend_from_new_page<'a, T: Decoder<'a>>( + mut page: T::State, + chunk_size: Option, + items: &mut VecDeque, + remaining: &mut usize, + decoder: &T, +) { + let capacity = chunk_size.unwrap_or(0); + let chunk_size = chunk_size.unwrap_or(usize::MAX); + + let mut decoded = if let Some(decoded) = items.pop_back() { + decoded + } else { + // there is no state => initialize it + decoder.with_capacity(capacity) + }; + let existing = decoded.len(); + + let additional = (chunk_size - existing).min(*remaining); + + decoder.extend_from_state(&mut page, &mut decoded, additional); + *remaining -= decoded.len() - existing; + items.push_back(decoded); + + while page.len() > 0 && *remaining > 0 { + let additional = chunk_size.min(*remaining); + + let mut decoded = decoder.with_capacity(additional); + decoder.extend_from_state(&mut page, &mut decoded, additional); + *remaining -= decoded.len(); + items.push_back(decoded) + } +} + +/// Represents what happened when a new page was consumed +#[derive(Debug)] +pub enum MaybeNext
<P>
{ + /// Whether the page was sufficient to fill `chunk_size` + Some(P), + /// whether there are no more pages or intermediary decoded states + None, + /// Whether the page was insufficient to fill `chunk_size` and a new page is required + More, +} + +#[inline] +pub(super) fn next<'a, I: Pages, D: Decoder<'a>>( + iter: &'a mut I, + items: &'a mut VecDeque, + dict: &'a mut Option, + remaining: &'a mut usize, + chunk_size: Option, + decoder: &'a D, +) -> MaybeNext> { + // front[a1, a2, a3, ...]back + if items.len() > 1 { + return MaybeNext::Some(Ok(items.pop_front().unwrap())); + } + if (items.len() == 1) && items.front().unwrap().len() == chunk_size.unwrap_or(usize::MAX) { + return MaybeNext::Some(Ok(items.pop_front().unwrap())); + } + if *remaining == 0 { + return match items.pop_front() { + Some(decoded) => MaybeNext::Some(Ok(decoded)), + None => MaybeNext::None, + }; + } + + match iter.next() { + Err(e) => MaybeNext::Some(Err(e.into())), + Ok(Some(page)) => { + let page = match page { + Page::Data(page) => page, + Page::Dict(dict_page) => { + *dict = Some(decoder.deserialize_dict(dict_page)); + return MaybeNext::More; + }, + }; + + // there is a new page => consume the page from the start + let maybe_page = decoder.build_state(page, dict.as_ref()); + let page = match maybe_page { + Ok(page) => page, + Err(e) => return MaybeNext::Some(Err(e)), + }; + + extend_from_new_page(page, chunk_size, items, remaining, decoder); + + if (items.len() == 1) && items.front().unwrap().len() < chunk_size.unwrap_or(usize::MAX) + { + MaybeNext::More + } else { + let decoded = items.pop_front().unwrap(); + MaybeNext::Some(Ok(decoded)) + } + }, + Ok(None) => { + if let Some(decoded) = items.pop_front() { + // we have a populated item and no more pages + // the only case where an item's length may be smaller than chunk_size + debug_assert!(decoded.len() <= chunk_size.unwrap_or(usize::MAX)); + MaybeNext::Some(Ok(decoded)) + } else { + MaybeNext::None + } + }, + } +} + +#[inline] +pub(super) fn dict_indices_decoder(page: &DataPage) -> Result { + let (_, _, indices_buffer) = split_buffer(page)?; + + // SPEC: Data page format: the bit width used to encode the entry ids stored as 1 byte (max bit width = 32), + // SPEC: followed by the values encoded using RLE/Bit packed described above (with the given bit width). + let bit_width = indices_buffer[0]; + let indices_buffer = &indices_buffer[1..]; + + hybrid_rle::HybridRleDecoder::try_new(indices_buffer, bit_width as u32, page.num_values()) + .map_err(Error::from) +} diff --git a/crates/nano-arrow/src/io/parquet/read/file.rs b/crates/nano-arrow/src/io/parquet/read/file.rs new file mode 100644 index 000000000000..750340c60ef7 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/file.rs @@ -0,0 +1,205 @@ +use std::io::{Read, Seek}; + +use parquet2::indexes::FilteredPage; + +use super::{RowGroupDeserializer, RowGroupMetaData}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::Result; +use crate::io::parquet::read::read_columns_many; + +/// An iterator of [`Chunk`]s coming from row groups of a parquet file. +/// +/// This can be thought of a flatten chain of [`Iterator`] - each row group is sequentially +/// mapped to an [`Iterator`] and each iterator is iterated upon until either the limit +/// or the last iterator ends. +/// # Implementation +/// This iterator is single threaded on both IO-bounded and CPU-bounded tasks, and mixes them. 
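+///
+/// # Example
+///
+/// A minimal usage sketch; the file name is illustrative and error handling is elided:
+///
+/// ```ignore
+/// use std::fs::File;
+///
+/// let mut file = File::open("example.parquet")?;
+/// let metadata = read_metadata(&mut file)?;
+/// let schema = infer_schema(&metadata)?;
+/// // no chunk-size limit, no row limit and no page indexes
+/// let reader = FileReader::new(file, metadata.row_groups, schema, None, None, None);
+/// for maybe_chunk in reader {
+///     let chunk = maybe_chunk?;
+///     // process the columns of `chunk`
+/// }
+/// ```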
+pub struct FileReader { + row_groups: RowGroupReader, + remaining_rows: usize, + current_row_group: Option, +} + +impl FileReader { + /// Returns a new [`FileReader`]. + pub fn new( + reader: R, + row_groups: Vec, + schema: Schema, + chunk_size: Option, + limit: Option, + page_indexes: Option>>>>, + ) -> Self { + let row_groups = + RowGroupReader::new(reader, schema, row_groups, chunk_size, limit, page_indexes); + + Self { + row_groups, + remaining_rows: limit.unwrap_or(usize::MAX), + current_row_group: None, + } + } + + fn next_row_group(&mut self) -> Result> { + let result = self.row_groups.next().transpose()?; + + // If current_row_group is None, then there will be no elements to remove. + if self.current_row_group.is_some() { + self.remaining_rows = self.remaining_rows.saturating_sub( + result + .as_ref() + .map(|x| x.num_rows()) + .unwrap_or(self.remaining_rows), + ); + } + Ok(result) + } + + /// Returns the [`Schema`] associated to this file. + pub fn schema(&self) -> &Schema { + &self.row_groups.schema + } +} + +impl Iterator for FileReader { + type Item = Result>>; + + fn next(&mut self) -> Option { + if self.remaining_rows == 0 { + // reached the limit + return None; + } + + if let Some(row_group) = &mut self.current_row_group { + match row_group.next() { + // no more chunks in the current row group => try a new one + None => match self.next_row_group() { + Ok(Some(row_group)) => { + self.current_row_group = Some(row_group); + // new found => pull again + self.next() + }, + Ok(None) => { + self.current_row_group = None; + None + }, + Err(e) => Some(Err(e)), + }, + other => other, + } + } else { + match self.next_row_group() { + Ok(Some(row_group)) => { + self.current_row_group = Some(row_group); + self.next() + }, + Ok(None) => { + self.current_row_group = None; + None + }, + Err(e) => Some(Err(e)), + } + } + } +} + +/// An [`Iterator`] from row groups of a parquet file. +/// +/// # Implementation +/// Advancing this iterator is IO-bounded - each iteration reads all the column chunks from the file +/// to memory and attaches [`RowGroupDeserializer`] to them so that they can be iterated in chunks. +pub struct RowGroupReader { + reader: R, + schema: Schema, + row_groups: std::vec::IntoIter, + chunk_size: Option, + remaining_rows: usize, + page_indexes: Option>>>>, +} + +impl RowGroupReader { + /// Returns a new [`RowGroupReader`] + pub fn new( + reader: R, + schema: Schema, + row_groups: Vec, + chunk_size: Option, + limit: Option, + page_indexes: Option>>>>, + ) -> Self { + if let Some(pages) = &page_indexes { + assert_eq!(pages.len(), row_groups.len()) + } + Self { + reader, + schema, + row_groups: row_groups.into_iter(), + chunk_size, + remaining_rows: limit.unwrap_or(usize::MAX), + page_indexes: page_indexes.map(|pages| pages.into_iter()), + } + } + + #[inline] + fn _next(&mut self) -> Result> { + if self.schema.fields.is_empty() { + return Ok(None); + } + if self.remaining_rows == 0 { + // reached the limit + return Ok(None); + } + + let row_group = if let Some(row_group) = self.row_groups.next() { + row_group + } else { + return Ok(None); + }; + + let pages = self.page_indexes.as_mut().and_then(|iter| iter.next()); + + // the number of rows depends on whether indexes are selected or not. 
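+        // When page indexes are present, the selected row count is the sum of the lengths of
+        // the intervals selected for the first column of the first field (the same row
+        // selection is assumed for every column); otherwise it is the full row count of the
+        // row group.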
+ let num_rows = pages + .as_ref() + .map(|x| { + // first field, first column within that field + x[0][0] + .iter() + .map(|page| { + page.selected_rows + .iter() + .map(|interval| interval.length) + .sum::() + }) + .sum() + }) + .unwrap_or_else(|| row_group.num_rows()); + + let column_chunks = read_columns_many( + &mut self.reader, + &row_group, + self.schema.fields.clone(), + self.chunk_size, + Some(self.remaining_rows), + pages, + )?; + + let result = RowGroupDeserializer::new(column_chunks, num_rows, Some(self.remaining_rows)); + self.remaining_rows = self.remaining_rows.saturating_sub(num_rows); + Ok(Some(result)) + } +} + +impl Iterator for RowGroupReader { + type Item = Result; + + fn next(&mut self) -> Option { + self._next().transpose() + } + + fn size_hint(&self) -> (usize, Option) { + self.row_groups.size_hint() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/indexes/binary.rs b/crates/nano-arrow/src/io/parquet/read/indexes/binary.rs new file mode 100644 index 000000000000..9a7c7c4ca90b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/indexes/binary.rs @@ -0,0 +1,40 @@ +use parquet2::indexes::PageIndex; + +use super::ColumnPageStatistics; +use crate::array::{Array, BinaryArray, PrimitiveArray, Utf8Array}; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Error; +use crate::trusted_len::TrustedLen; + +pub fn deserialize( + indexes: &[PageIndex>], + data_type: &DataType, +) -> Result { + Ok(ColumnPageStatistics { + min: deserialize_binary_iter(indexes.iter().map(|index| index.min.as_ref()), data_type)?, + max: deserialize_binary_iter(indexes.iter().map(|index| index.max.as_ref()), data_type)?, + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + }) +} + +fn deserialize_binary_iter<'a, I: TrustedLen>>>( + iter: I, + data_type: &DataType, +) -> Result, Error> { + match data_type.to_physical_type() { + PhysicalType::LargeBinary => Ok(Box::new(BinaryArray::::from_iter(iter))), + PhysicalType::Utf8 => { + let iter = iter.map(|x| x.map(|x| std::str::from_utf8(x)).transpose()); + Ok(Box::new(Utf8Array::::try_from_trusted_len_iter(iter)?)) + }, + PhysicalType::LargeUtf8 => { + let iter = iter.map(|x| x.map(|x| std::str::from_utf8(x)).transpose()); + Ok(Box::new(Utf8Array::::try_from_trusted_len_iter(iter)?)) + }, + _ => Ok(Box::new(BinaryArray::::from_iter(iter))), + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/indexes/boolean.rs b/crates/nano-arrow/src/io/parquet/read/indexes/boolean.rs new file mode 100644 index 000000000000..70977197d103 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/indexes/boolean.rs @@ -0,0 +1,20 @@ +use parquet2::indexes::PageIndex; + +use super::ColumnPageStatistics; +use crate::array::{BooleanArray, PrimitiveArray}; + +pub fn deserialize(indexes: &[PageIndex]) -> ColumnPageStatistics { + ColumnPageStatistics { + min: Box::new(BooleanArray::from_trusted_len_iter( + indexes.iter().map(|index| index.min), + )), + max: Box::new(BooleanArray::from_trusted_len_iter( + indexes.iter().map(|index| index.max), + )), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/indexes/fixed_len_binary.rs b/crates/nano-arrow/src/io/parquet/read/indexes/fixed_len_binary.rs new file mode 100644 index 000000000000..26002e5857d5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/indexes/fixed_len_binary.rs @@ 
-0,0 +1,67 @@ +use parquet2::indexes::PageIndex; + +use super::ColumnPageStatistics; +use crate::array::{Array, FixedSizeBinaryArray, MutableFixedSizeBinaryArray, PrimitiveArray}; +use crate::datatypes::{DataType, PhysicalType, PrimitiveType}; +use crate::trusted_len::TrustedLen; +use crate::types::{i256, NativeType}; + +pub fn deserialize(indexes: &[PageIndex>], data_type: DataType) -> ColumnPageStatistics { + ColumnPageStatistics { + min: deserialize_binary_iter( + indexes.iter().map(|index| index.min.as_ref()), + data_type.clone(), + ), + max: deserialize_binary_iter(indexes.iter().map(|index| index.max.as_ref()), data_type), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} + +fn deserialize_binary_iter<'a, I: TrustedLen>>>( + iter: I, + data_type: DataType, +) -> Box { + match data_type.to_physical_type() { + PhysicalType::Primitive(PrimitiveType::Int128) => { + Box::new(PrimitiveArray::from_trusted_len_iter(iter.map(|v| { + v.map(|x| { + // Copy the fixed-size byte value to the start of a 16 byte stack + // allocated buffer, then use an arithmetic right shift to fill in + // MSBs, which accounts for leading 1's in negative (two's complement) + // values. + let n = x.len(); + let mut bytes = [0u8; 16]; + bytes[..n].copy_from_slice(x); + i128::from_be_bytes(bytes) >> (8 * (16 - n)) + }) + }))) + }, + PhysicalType::Primitive(PrimitiveType::Int256) => { + Box::new(PrimitiveArray::from_trusted_len_iter(iter.map(|v| { + v.map(|x| { + let n = x.len(); + let mut bytes = [0u8; 32]; + bytes[..n].copy_from_slice(x); + i256::from_be_bytes(bytes) + }) + }))) + }, + _ => { + let mut a = MutableFixedSizeBinaryArray::try_new( + data_type, + Vec::with_capacity(iter.size_hint().0), + None, + ) + .unwrap(); + for item in iter { + a.push(item); + } + let a: FixedSizeBinaryArray = a.into(); + Box::new(a) + }, + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/indexes/mod.rs b/crates/nano-arrow/src/io/parquet/read/indexes/mod.rs new file mode 100644 index 000000000000..b60b717ebfd5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/indexes/mod.rs @@ -0,0 +1,381 @@ +//! API to perform page-level filtering (also known as indexes) +use parquet2::error::Error as ParquetError; +use parquet2::indexes::{ + select_pages, BooleanIndex, ByteIndex, FixedLenByteIndex, Index as ParquetIndex, NativeIndex, + PageLocation, +}; +use parquet2::metadata::{ColumnChunkMetaData, RowGroupMetaData}; +use parquet2::read::{read_columns_indexes as _read_columns_indexes, read_pages_locations}; +use parquet2::schema::types::PhysicalType as ParquetPhysicalType; + +mod binary; +mod boolean; +mod fixed_len_binary; +mod primitive; + +use std::collections::VecDeque; +use std::io::{Read, Seek}; + +pub use parquet2::indexes::{FilteredPage, Interval}; + +use super::get_field_pages; +use crate::array::{Array, UInt64Array}; +use crate::datatypes::{DataType, Field, PhysicalType, PrimitiveType}; +use crate::error::Error; + +/// Page statistics of an Arrow field. +#[derive(Debug, PartialEq)] +pub enum FieldPageStatistics { + /// Variant used for fields with a single parquet column (e.g. primitives, dictionaries, list) + Single(ColumnPageStatistics), + /// Variant used for fields with multiple parquet columns (e.g. 
Struct, Map) + Multiple(Vec), +} + +impl From for FieldPageStatistics { + fn from(column: ColumnPageStatistics) -> Self { + Self::Single(column) + } +} + +/// [`ColumnPageStatistics`] contains the minimum, maximum, and null_count +/// of each page of a parquet column, as an [`Array`]. +/// This struct has the following invariants: +/// * `min`, `max` and `null_count` have the same length (equal to the number of pages in the column) +/// * `min`, `max` and `null_count` are guaranteed to be non-null +/// * `min` and `max` have the same logical type +#[derive(Debug, PartialEq)] +pub struct ColumnPageStatistics { + /// The minimum values in the pages + pub min: Box, + /// The maximum values in the pages + pub max: Box, + /// The number of null values in the pages. + pub null_count: UInt64Array, +} + +/// Given a sequence of [`ParquetIndex`] representing the page indexes of each column in the +/// parquet file, returns the page-level statistics as a [`FieldPageStatistics`]. +/// +/// This function maps timestamps, decimal types, etc. accordingly. +/// # Implementation +/// This function is CPU-bounded `O(P)` where `P` is the total number of pages on all columns. +/// # Error +/// This function errors iff the value is not deserializable to arrow (e.g. invalid utf-8) +fn deserialize( + indexes: &mut VecDeque<&Box>, + data_type: DataType, +) -> Result { + match data_type.to_physical_type() { + PhysicalType::Boolean => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::() + .unwrap(); + Ok(boolean::deserialize(&index.indexes).into()) + }, + PhysicalType::Primitive(PrimitiveType::Int128) => { + let index = indexes.pop_front().unwrap(); + match index.physical_type() { + ParquetPhysicalType::Int32 => { + let index = index.as_any().downcast_ref::>().unwrap(); + Ok(primitive::deserialize_i32(&index.indexes, data_type).into()) + }, + parquet2::schema::types::PhysicalType::Int64 => { + let index = index.as_any().downcast_ref::>().unwrap(); + Ok( + primitive::deserialize_i64( + &index.indexes, + &index.primitive_type, + data_type, + ) + .into(), + ) + }, + parquet2::schema::types::PhysicalType::FixedLenByteArray(_) => { + let index = index.as_any().downcast_ref::().unwrap(); + Ok(fixed_len_binary::deserialize(&index.indexes, data_type).into()) + }, + other => Err(Error::nyi(format!( + "Deserialize {other:?} to arrow's int64" + ))), + } + }, + PhysicalType::Primitive(PrimitiveType::Int256) => { + let index = indexes.pop_front().unwrap(); + match index.physical_type() { + ParquetPhysicalType::Int32 => { + let index = index.as_any().downcast_ref::>().unwrap(); + Ok(primitive::deserialize_i32(&index.indexes, data_type).into()) + }, + parquet2::schema::types::PhysicalType::Int64 => { + let index = index.as_any().downcast_ref::>().unwrap(); + Ok( + primitive::deserialize_i64( + &index.indexes, + &index.primitive_type, + data_type, + ) + .into(), + ) + }, + parquet2::schema::types::PhysicalType::FixedLenByteArray(_) => { + let index = index.as_any().downcast_ref::().unwrap(); + Ok(fixed_len_binary::deserialize(&index.indexes, data_type).into()) + }, + other => Err(Error::nyi(format!( + "Deserialize {other:?} to arrow's int64" + ))), + } + }, + PhysicalType::Primitive(PrimitiveType::UInt8) + | PhysicalType::Primitive(PrimitiveType::UInt16) + | PhysicalType::Primitive(PrimitiveType::UInt32) + | PhysicalType::Primitive(PrimitiveType::Int32) => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(primitive::deserialize_i32(&index.indexes, 
data_type).into()) + }, + PhysicalType::Primitive(PrimitiveType::UInt64) + | PhysicalType::Primitive(PrimitiveType::Int64) => { + let index = indexes.pop_front().unwrap(); + match index.physical_type() { + ParquetPhysicalType::Int64 => { + let index = index.as_any().downcast_ref::>().unwrap(); + Ok( + primitive::deserialize_i64( + &index.indexes, + &index.primitive_type, + data_type, + ) + .into(), + ) + }, + parquet2::schema::types::PhysicalType::Int96 => { + let index = index + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(primitive::deserialize_i96(&index.indexes, data_type).into()) + }, + other => Err(Error::nyi(format!( + "Deserialize {other:?} to arrow's int64" + ))), + } + }, + PhysicalType::Primitive(PrimitiveType::Float32) => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(primitive::deserialize_id(&index.indexes, data_type).into()) + }, + PhysicalType::Primitive(PrimitiveType::Float64) => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::>() + .unwrap(); + Ok(primitive::deserialize_id(&index.indexes, data_type).into()) + }, + PhysicalType::Binary + | PhysicalType::LargeBinary + | PhysicalType::Utf8 + | PhysicalType::LargeUtf8 => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::() + .unwrap(); + binary::deserialize(&index.indexes, &data_type).map(|x| x.into()) + }, + PhysicalType::FixedSizeBinary => { + let index = indexes + .pop_front() + .unwrap() + .as_any() + .downcast_ref::() + .unwrap(); + Ok(fixed_len_binary::deserialize(&index.indexes, data_type).into()) + }, + PhysicalType::Dictionary(_) => { + if let DataType::Dictionary(_, inner, _) = data_type.to_logical_type() { + deserialize(indexes, (**inner).clone()) + } else { + unreachable!() + } + }, + PhysicalType::List => { + if let DataType::List(inner) = data_type.to_logical_type() { + deserialize(indexes, inner.data_type.clone()) + } else { + unreachable!() + } + }, + PhysicalType::LargeList => { + if let DataType::LargeList(inner) = data_type.to_logical_type() { + deserialize(indexes, inner.data_type.clone()) + } else { + unreachable!() + } + }, + PhysicalType::Map => { + if let DataType::Map(inner, _) = data_type.to_logical_type() { + deserialize(indexes, inner.data_type.clone()) + } else { + unreachable!() + } + }, + PhysicalType::Struct => { + let children_fields = if let DataType::Struct(children) = data_type.to_logical_type() { + children + } else { + unreachable!() + }; + let children = children_fields + .iter() + .map(|child| deserialize(indexes, child.data_type.clone())) + .collect::, Error>>()?; + + Ok(FieldPageStatistics::Multiple(children)) + }, + + other => Err(Error::nyi(format!( + "Deserialize into arrow's {other:?} page index" + ))), + } +} + +/// Checks whether the row group have page index information (page statistics) +pub fn has_indexes(row_group: &RowGroupMetaData) -> bool { + row_group + .columns() + .iter() + .all(|chunk| chunk.column_chunk().column_index_offset.is_some()) +} + +/// Reads the column indexes from the reader assuming a valid set of derived Arrow fields +/// for all parquet the columns in the file. +/// +/// It returns one [`FieldPageStatistics`] per field in `fields` +/// +/// This function is expected to be used to filter out parquet pages. +/// +/// # Implementation +/// This function is IO-bounded and calls `reader.read_exact` exactly once. +/// # Error +/// Errors iff the indexes can't be read or their deserialization to arrow is incorrect (e.g. 
invalid utf-8) +pub fn read_columns_indexes( + reader: &mut R, + chunks: &[ColumnChunkMetaData], + fields: &[Field], +) -> Result, Error> { + let indexes = _read_columns_indexes(reader, chunks)?; + + fields + .iter() + .map(|field| { + let indexes = get_field_pages(chunks, &indexes, &field.name); + let mut indexes = indexes.into_iter().collect(); + + deserialize(&mut indexes, field.data_type.clone()) + }) + .collect() +} + +/// Returns the set of (row) intervals of the pages. +pub fn compute_page_row_intervals( + locations: &[PageLocation], + num_rows: usize, +) -> Result, ParquetError> { + if locations.is_empty() { + return Ok(vec![]); + }; + + let last = (|| { + let start: usize = locations.last().unwrap().first_row_index.try_into()?; + let length = num_rows - start; + Result::<_, ParquetError>::Ok(Interval::new(start, length)) + })(); + + let pages_lengths = locations + .windows(2) + .map(|x| { + let start = usize::try_from(x[0].first_row_index)?; + let length = usize::try_from(x[1].first_row_index - x[0].first_row_index)?; + Ok(Interval::new(start, length)) + }) + .chain(std::iter::once(last)); + pages_lengths.collect() +} + +/// Reads all page locations and index locations (IO-bounded) and uses `predicate` to compute +/// the set of [`FilteredPage`] that fulfill the predicate. +/// +/// The non-trivial argument of this function is `predicate`, that controls which pages are selected. +/// Its signature contains 2 arguments: +/// * 0th argument (indexes): contains one [`ColumnPageStatistics`] (page statistics) per field. +/// Use it to evaluate the predicate against +/// * 1th argument (intervals): contains one [`Vec>`] (row positions) per field. +/// For each field, the outermost vector corresponds to each parquet column: +/// a primitive field contains 1 column, a struct field with 2 primitive fields contain 2 columns. +/// The inner `Vec` contains one [`Interval`] per page: its length equals the length of [`ColumnPageStatistics`]. +/// It returns a single [`Vec`] denoting the set of intervals that the predicate selects (over all columns). +/// +/// This returns one item per `field`. For each field, there is one item per column (for non-nested types it returns one column) +/// and finally [`Vec`], that corresponds to the set of selected pages. 
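+///
+/// # Example
+///
+/// A rough sketch of a predicate that keeps every page; `reader`, `row_group` and `fields` are
+/// assumed to be available, and a real predicate would compare the statistics against a filter:
+///
+/// ```ignore
+/// let pages = read_filtered_pages(&mut reader, &row_group, &fields, |_statistics, intervals| {
+///     // select all row intervals of the first column of the first field
+///     intervals[0][0].clone()
+/// })?;
+/// ```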
+pub fn read_filtered_pages< + R: Read + Seek, + F: Fn(&[FieldPageStatistics], &[Vec>]) -> Vec, +>( + reader: &mut R, + row_group: &RowGroupMetaData, + fields: &[Field], + predicate: F, + //is_intersection: bool, +) -> Result>>, Error> { + let num_rows = row_group.num_rows(); + + // one vec per column + let locations = read_pages_locations(reader, row_group.columns())?; + // one Vec> per field (non-nested contain a single entry on the first column) + let locations = fields + .iter() + .map(|field| get_field_pages(row_group.columns(), &locations, &field.name)) + .collect::>(); + + // one ColumnPageStatistics per field + let indexes = read_columns_indexes(reader, row_group.columns(), fields)?; + + let intervals = locations + .iter() + .map(|locations| { + locations + .iter() + .map(|locations| Ok(compute_page_row_intervals(locations, num_rows)?)) + .collect::, Error>>() + }) + .collect::, Error>>()?; + + let intervals = predicate(&indexes, &intervals); + + locations + .into_iter() + .map(|locations| { + locations + .into_iter() + .map(|locations| Ok(select_pages(&intervals, locations, num_rows)?)) + .collect::, Error>>() + }) + .collect() +} diff --git a/crates/nano-arrow/src/io/parquet/read/indexes/primitive.rs b/crates/nano-arrow/src/io/parquet/read/indexes/primitive.rs new file mode 100644 index 000000000000..90e52e4a4aaf --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/indexes/primitive.rs @@ -0,0 +1,222 @@ +use ethnum::I256; +use parquet2::indexes::PageIndex; +use parquet2::schema::types::{PrimitiveLogicalType, PrimitiveType, TimeUnit as ParquetTimeUnit}; +use parquet2::types::int96_to_i64_ns; + +use super::ColumnPageStatistics; +use crate::array::{Array, MutablePrimitiveArray, PrimitiveArray}; +use crate::datatypes::{DataType, TimeUnit}; +use crate::trusted_len::TrustedLen; +use crate::types::{i256, NativeType}; + +#[inline] +fn deserialize_int32>>( + iter: I, + data_type: DataType, +) -> Box { + use DataType::*; + match data_type.to_logical_type() { + UInt8 => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as u8))) + .to(data_type), + ) as _, + UInt16 => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as u16))) + .to(data_type), + ), + UInt32 => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as u32))) + .to(data_type), + ), + Decimal(_, _) => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as i128))) + .to(data_type), + ), + Decimal256(_, _) => Box::new( + PrimitiveArray::::from_trusted_len_iter( + iter.map(|x| x.map(|x| i256(I256::new(x.into())))), + ) + .to(data_type), + ) as _, + _ => Box::new(PrimitiveArray::::from_trusted_len_iter(iter).to(data_type)), + } +} + +#[inline] +fn timestamp( + array: &mut MutablePrimitiveArray, + time_unit: TimeUnit, + logical_type: Option, +) { + let unit = if let Some(PrimitiveLogicalType::Timestamp { unit, .. 
}) = logical_type { + unit + } else { + return; + }; + + match (unit, time_unit) { + (ParquetTimeUnit::Milliseconds, TimeUnit::Second) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000), + (ParquetTimeUnit::Microseconds, TimeUnit::Second) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000_000), + (ParquetTimeUnit::Nanoseconds, TimeUnit::Second) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000_000_000), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Millisecond) => {}, + (ParquetTimeUnit::Microseconds, TimeUnit::Millisecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000), + (ParquetTimeUnit::Nanoseconds, TimeUnit::Millisecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000_000), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Microsecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x *= 1_000), + (ParquetTimeUnit::Microseconds, TimeUnit::Microsecond) => {}, + (ParquetTimeUnit::Nanoseconds, TimeUnit::Microsecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000), + + (ParquetTimeUnit::Milliseconds, TimeUnit::Nanosecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x *= 1_000_000), + (ParquetTimeUnit::Microseconds, TimeUnit::Nanosecond) => array + .values_mut_slice() + .iter_mut() + .for_each(|x| *x /= 1_000), + (ParquetTimeUnit::Nanoseconds, TimeUnit::Nanosecond) => {}, + } +} + +#[inline] +fn deserialize_int64>>( + iter: I, + primitive_type: &PrimitiveType, + data_type: DataType, +) -> Box { + use DataType::*; + match data_type.to_logical_type() { + UInt64 => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as u64))) + .to(data_type), + ) as _, + Decimal(_, _) => Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(|x| x as i128))) + .to(data_type), + ) as _, + Decimal256(_, _) => Box::new( + PrimitiveArray::::from_trusted_len_iter( + iter.map(|x| x.map(|x| i256(I256::new(x.into())))), + ) + .to(data_type), + ) as _, + Timestamp(time_unit, _) => { + let mut array = + MutablePrimitiveArray::::from_trusted_len_iter(iter).to(data_type.clone()); + + timestamp(&mut array, *time_unit, primitive_type.logical_type); + + let array: PrimitiveArray = array.into(); + + Box::new(array) + }, + _ => Box::new(PrimitiveArray::::from_trusted_len_iter(iter).to(data_type)), + } +} + +#[inline] +fn deserialize_int96>>( + iter: I, + data_type: DataType, +) -> Box { + Box::new( + PrimitiveArray::::from_trusted_len_iter(iter.map(|x| x.map(int96_to_i64_ns))) + .to(data_type), + ) +} + +#[inline] +fn deserialize_id_s>>( + iter: I, + data_type: DataType, +) -> Box { + Box::new(PrimitiveArray::::from_trusted_len_iter(iter).to(data_type)) +} + +pub fn deserialize_i32(indexes: &[PageIndex], data_type: DataType) -> ColumnPageStatistics { + ColumnPageStatistics { + min: deserialize_int32(indexes.iter().map(|index| index.min), data_type.clone()), + max: deserialize_int32(indexes.iter().map(|index| index.max), data_type), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} + +pub fn deserialize_i64( + indexes: &[PageIndex], + primitive_type: &PrimitiveType, + data_type: DataType, +) -> ColumnPageStatistics { + ColumnPageStatistics { + min: deserialize_int64( + indexes.iter().map(|index| index.min), + primitive_type, + data_type.clone(), + ), + max: deserialize_int64( + indexes.iter().map(|index| index.max), + 
primitive_type, + data_type, + ), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} + +pub fn deserialize_i96( + indexes: &[PageIndex<[u32; 3]>], + data_type: DataType, +) -> ColumnPageStatistics { + ColumnPageStatistics { + min: deserialize_int96(indexes.iter().map(|index| index.min), data_type.clone()), + max: deserialize_int96(indexes.iter().map(|index| index.max), data_type), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} + +pub fn deserialize_id( + indexes: &[PageIndex], + data_type: DataType, +) -> ColumnPageStatistics { + ColumnPageStatistics { + min: deserialize_id_s(indexes.iter().map(|index| index.min), data_type.clone()), + max: deserialize_id_s(indexes.iter().map(|index| index.max), data_type), + null_count: PrimitiveArray::from_trusted_len_iter( + indexes + .iter() + .map(|index| index.null_count.map(|x| x as u64)), + ), + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/mod.rs b/crates/nano-arrow/src/io/parquet/read/mod.rs new file mode 100644 index 000000000000..52a4d07d922e --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/mod.rs @@ -0,0 +1,95 @@ +//! APIs to read from Parquet format. +#![allow(clippy::type_complexity)] + +mod deserialize; +mod file; +pub mod indexes; +mod row_group; +pub mod schema; +pub mod statistics; + +use std::io::{Read, Seek}; + +pub use deserialize::{ + column_iter_to_arrays, create_list, create_map, get_page_iterator, init_nested, n_columns, + InitNested, NestedArrayIter, NestedState, StructIterator, +}; +pub use file::{FileReader, RowGroupReader}; +use futures::{AsyncRead, AsyncSeek}; +// re-exports of parquet2's relevant APIs +pub use parquet2::{ + error::Error as ParquetError, + fallible_streaming_iterator, + metadata::{ColumnChunkMetaData, ColumnDescriptor, RowGroupMetaData}, + page::{CompressedDataPage, DataPageHeader, Page}, + read::{ + decompress, get_column_iterator, get_page_stream, + read_columns_indexes as _read_columns_indexes, read_metadata as _read_metadata, + read_metadata_async as _read_metadata_async, read_pages_locations, BasicDecompressor, + Decompressor, MutStreamingIterator, PageFilter, PageReader, ReadColumnIterator, State, + }, + schema::types::{ + GroupLogicalType, ParquetType, PhysicalType, PrimitiveConvertedType, PrimitiveLogicalType, + TimeUnit as ParquetTimeUnit, + }, + types::int96_to_i64_ns, + FallibleStreamingIterator, +}; +pub use row_group::*; +pub use schema::{infer_schema, FileMetaData}; + +use crate::array::Array; +use crate::error::Result; +use crate::types::{i256, NativeType}; + +/// Trait describing a [`FallibleStreamingIterator`] of [`Page`] +pub trait Pages: + FallibleStreamingIterator + Send + Sync +{ +} + +impl + Send + Sync> Pages for I {} + +/// Type def for a sharable, boxed dyn [`Iterator`] of arrays +pub type ArrayIter<'a> = Box>> + Send + Sync + 'a>; + +/// Reads parquets' metadata synchronously. +pub fn read_metadata(reader: &mut R) -> Result { + Ok(_read_metadata(reader)?) +} + +/// Reads parquets' metadata asynchronously. +pub async fn read_metadata_async( + reader: &mut R, +) -> Result { + Ok(_read_metadata_async(reader).await?) 
+} + +fn convert_days_ms(value: &[u8]) -> crate::types::days_ms { + crate::types::days_ms( + i32::from_le_bytes(value[4..8].try_into().unwrap()), + i32::from_le_bytes(value[8..12].try_into().unwrap()), + ) +} + +fn convert_i128(value: &[u8], n: usize) -> i128 { + // Copy the fixed-size byte value to the start of a 16 byte stack + // allocated buffer, then use an arithmetic right shift to fill in + // MSBs, which accounts for leading 1's in negative (two's complement) + // values. + let mut bytes = [0u8; 16]; + bytes[..n].copy_from_slice(value); + i128::from_be_bytes(bytes) >> (8 * (16 - n)) +} + +fn convert_i256(value: &[u8]) -> i256 { + if value[0] >= 128 { + let mut neg_bytes = [255u8; 32]; + neg_bytes[32 - value.len()..].copy_from_slice(value); + i256::from_be_bytes(neg_bytes) + } else { + let mut bytes = [0u8; 32]; + bytes[32 - value.len()..].copy_from_slice(value); + i256::from_be_bytes(bytes) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/row_group.rs b/crates/nano-arrow/src/io/parquet/read/row_group.rs new file mode 100644 index 000000000000..0b72897c5ac6 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/row_group.rs @@ -0,0 +1,339 @@ +use std::io::{Read, Seek}; + +use futures::future::{try_join_all, BoxFuture}; +use futures::{AsyncRead, AsyncReadExt, AsyncSeek, AsyncSeekExt}; +use parquet2::indexes::FilteredPage; +use parquet2::metadata::ColumnChunkMetaData; +use parquet2::read::{BasicDecompressor, IndexedPageReader, PageMetaData, PageReader}; + +use super::{ArrayIter, RowGroupMetaData}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Field; +use crate::error::Result; +use crate::io::parquet::read::column_iter_to_arrays; + +/// An [`Iterator`] of [`Chunk`] that (dynamically) adapts a vector of iterators of [`Array`] into +/// an iterator of [`Chunk`]. +/// +/// This struct tracks advances each of the iterators individually and combines the +/// result in a single [`Chunk`]. +/// +/// # Implementation +/// This iterator is single-threaded and advancing it is CPU-bounded. +pub struct RowGroupDeserializer { + num_rows: usize, + remaining_rows: usize, + column_chunks: Vec>, +} + +impl RowGroupDeserializer { + /// Creates a new [`RowGroupDeserializer`]. + /// + /// # Panic + /// This function panics iff any of the `column_chunks` + /// do not return an array with an equal length. + pub fn new( + column_chunks: Vec>, + num_rows: usize, + limit: Option, + ) -> Self { + Self { + num_rows, + remaining_rows: limit.unwrap_or(usize::MAX).min(num_rows), + column_chunks, + } + } + + /// Returns the number of rows on this row group + pub fn num_rows(&self) -> usize { + self.num_rows + } +} + +impl Iterator for RowGroupDeserializer { + type Item = Result>>; + + fn next(&mut self) -> Option { + if self.remaining_rows == 0 { + return None; + } + let chunk = self + .column_chunks + .iter_mut() + .map(|iter| iter.next().unwrap()) + .collect::>>() + .and_then(Chunk::try_new); + self.remaining_rows = self.remaining_rows.saturating_sub( + chunk + .as_ref() + .map(|x| x.len()) + .unwrap_or(self.remaining_rows), + ); + + Some(chunk) + } +} + +/// Returns all [`ColumnChunkMetaData`] associated to `field_name`. +/// For non-nested parquet types, this returns a single column +pub fn get_field_columns<'a>( + columns: &'a [ColumnChunkMetaData], + field_name: &str, +) -> Vec<&'a ColumnChunkMetaData> { + columns + .iter() + .filter(|x| x.descriptor().path_in_schema[0] == field_name) + .collect() +} + +/// Returns all [`ColumnChunkMetaData`] associated to `field_name`. 
+/// For non-nested parquet types, this returns a single column +pub fn get_field_pages<'a, T>( + columns: &'a [ColumnChunkMetaData], + items: &'a [T], + field_name: &str, +) -> Vec<&'a T> { + columns + .iter() + .zip(items) + .filter(|(metadata, _)| metadata.descriptor().path_in_schema[0] == field_name) + .map(|(_, item)| item) + .collect() +} + +/// Reads all columns that are part of the parquet field `field_name` +/// # Implementation +/// This operation is IO-bounded `O(C)` where C is the number of columns associated to +/// the field (one for non-nested types) +pub fn read_columns<'a, R: Read + Seek>( + reader: &mut R, + columns: &'a [ColumnChunkMetaData], + field_name: &str, +) -> Result)>> { + get_field_columns(columns, field_name) + .into_iter() + .map(|meta| _read_single_column(reader, meta)) + .collect() +} + +fn _read_single_column<'a, R>( + reader: &mut R, + meta: &'a ColumnChunkMetaData, +) -> Result<(&'a ColumnChunkMetaData, Vec)> +where + R: Read + Seek, +{ + let (start, length) = meta.byte_range(); + reader.seek(std::io::SeekFrom::Start(start))?; + + let mut chunk = vec![]; + chunk.try_reserve(length as usize)?; + reader.by_ref().take(length).read_to_end(&mut chunk)?; + Ok((meta, chunk)) +} + +async fn _read_single_column_async<'b, R, F>( + reader_factory: F, + meta: &ColumnChunkMetaData, +) -> Result<(&ColumnChunkMetaData, Vec)> +where + R: AsyncRead + AsyncSeek + Send + Unpin, + F: Fn() -> BoxFuture<'b, std::io::Result>, +{ + let mut reader = reader_factory().await?; + let (start, length) = meta.byte_range(); + reader.seek(std::io::SeekFrom::Start(start)).await?; + + let mut chunk = vec![]; + chunk.try_reserve(length as usize)?; + reader.take(length).read_to_end(&mut chunk).await?; + Result::Ok((meta, chunk)) +} + +/// Reads all columns that are part of the parquet field `field_name` +/// # Implementation +/// This operation is IO-bounded `O(C)` where C is the number of columns associated to +/// the field (one for non-nested types) +/// +/// It does so asynchronously via a single `join_all` over all the necessary columns for +/// `field_name`. +pub async fn read_columns_async< + 'a, + 'b, + R: AsyncRead + AsyncSeek + Send + Unpin, + F: Fn() -> BoxFuture<'b, std::io::Result> + Clone, +>( + reader_factory: F, + columns: &'a [ColumnChunkMetaData], + field_name: &str, +) -> Result)>> { + let futures = get_field_columns(columns, field_name) + .into_iter() + .map(|meta| async { _read_single_column_async(reader_factory.clone(), meta).await }); + + try_join_all(futures).await +} + +type Pages = Box< + dyn Iterator> + + Sync + + Send, +>; + +/// Converts a vector of columns associated with the parquet field whose name is [`Field`] +/// to an iterator of [`Array`], [`ArrayIter`] of chunk size `chunk_size`. 
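+///
+/// A short sketch combining it with [`read_columns`]; `reader`, `row_group` and `field` are
+/// assumed to be available from the surrounding code:
+///
+/// ```ignore
+/// let columns = read_columns(&mut reader, row_group.columns(), &field.name)?;
+/// let mut arrays = to_deserializer(columns, field, row_group.num_rows(), None, None)?;
+/// while let Some(array) = arrays.next().transpose()? {
+///     // use `array`
+/// }
+/// ```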
+pub fn to_deserializer<'a>( + columns: Vec<(&ColumnChunkMetaData, Vec)>, + field: Field, + num_rows: usize, + chunk_size: Option, + pages: Option>>, +) -> Result> { + let chunk_size = chunk_size.map(|c| c.min(num_rows)); + + let (columns, types) = if let Some(pages) = pages { + let (columns, types): (Vec<_>, Vec<_>) = columns + .into_iter() + .zip(pages) + .map(|((column_meta, chunk), mut pages)| { + // de-offset the start, since we read in chunks (and offset is from start of file) + let mut meta: PageMetaData = column_meta.into(); + pages + .iter_mut() + .for_each(|page| page.start -= meta.column_start); + meta.column_start = 0; + let pages = IndexedPageReader::new_with_page_meta( + std::io::Cursor::new(chunk), + meta, + pages, + vec![], + vec![], + ); + let pages = Box::new(pages) as Pages; + ( + BasicDecompressor::new(pages, vec![]), + &column_meta.descriptor().descriptor.primitive_type, + ) + }) + .unzip(); + + (columns, types) + } else { + let (columns, types): (Vec<_>, Vec<_>) = columns + .into_iter() + .map(|(column_meta, chunk)| { + let len = chunk.len(); + let pages = PageReader::new( + std::io::Cursor::new(chunk), + column_meta, + std::sync::Arc::new(|_, _| true), + vec![], + len * 2 + 1024, + ); + let pages = Box::new(pages) as Pages; + ( + BasicDecompressor::new(pages, vec![]), + &column_meta.descriptor().descriptor.primitive_type, + ) + }) + .unzip(); + + (columns, types) + }; + + column_iter_to_arrays(columns, types, field, chunk_size, num_rows) +} + +/// Returns a vector of iterators of [`Array`] ([`ArrayIter`]) corresponding to the top +/// level parquet fields whose name matches `fields`'s names. +/// +/// # Implementation +/// This operation is IO-bounded `O(C)` where C is the number of columns in the row group - +/// it reads all the columns to memory from the row group associated to the requested fields. +/// +/// This operation is single-threaded. For readers with stronger invariants +/// (e.g. implement [`Clone`]) you can use [`read_columns`] to read multiple columns at once +/// and convert them to [`ArrayIter`] via [`to_deserializer`]. +pub fn read_columns_many<'a, R: Read + Seek>( + reader: &mut R, + row_group: &RowGroupMetaData, + fields: Vec, + chunk_size: Option, + limit: Option, + pages: Option>>>, +) -> Result>> { + let num_rows = row_group.num_rows(); + let num_rows = limit.map(|limit| limit.min(num_rows)).unwrap_or(num_rows); + + // reads all the necessary columns for all fields from the row group + // This operation is IO-bounded `O(C)` where C is the number of columns in the row group + let field_columns = fields + .iter() + .map(|field| read_columns(reader, row_group.columns(), &field.name)) + .collect::>>()?; + + if let Some(pages) = pages { + field_columns + .into_iter() + .zip(fields) + .zip(pages) + .map(|((columns, field), pages)| { + to_deserializer(columns, field, num_rows, chunk_size, Some(pages)) + }) + .collect() + } else { + field_columns + .into_iter() + .zip(fields) + .map(|(columns, field)| to_deserializer(columns, field, num_rows, chunk_size, None)) + .collect() + } +} + +/// Returns a vector of iterators of [`Array`] corresponding to the top level parquet fields whose +/// name matches `fields`'s names. +/// +/// # Implementation +/// This operation is IO-bounded `O(C)` where C is the number of columns in the row group - +/// it reads all the columns to memory from the row group associated to the requested fields. 
+/// It does so asynchronously via `join_all` +pub async fn read_columns_many_async< + 'a, + 'b, + R: AsyncRead + AsyncSeek + Send + Unpin, + F: Fn() -> BoxFuture<'b, std::io::Result> + Clone, +>( + reader_factory: F, + row_group: &RowGroupMetaData, + fields: Vec, + chunk_size: Option, + limit: Option, + pages: Option>>>, +) -> Result>> { + let num_rows = row_group.num_rows(); + let num_rows = limit.map(|limit| limit.min(num_rows)).unwrap_or(num_rows); + + let futures = fields + .iter() + .map(|field| read_columns_async(reader_factory.clone(), row_group.columns(), &field.name)); + + let field_columns = try_join_all(futures).await?; + + if let Some(pages) = pages { + field_columns + .into_iter() + .zip(fields) + .zip(pages) + .map(|((columns, field), pages)| { + to_deserializer(columns, field, num_rows, chunk_size, Some(pages)) + }) + .collect() + } else { + field_columns + .into_iter() + .zip(fields.into_iter()) + .map(|(columns, field)| to_deserializer(columns, field, num_rows, chunk_size, None)) + .collect() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/schema/convert.rs b/crates/nano-arrow/src/io/parquet/read/schema/convert.rs new file mode 100644 index 000000000000..4ae50e05e8e0 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/schema/convert.rs @@ -0,0 +1,1049 @@ +//! This module has entry points, [`parquet_to_arrow_schema`] and the more configurable [`parquet_to_arrow_schema_with_options`]. +use parquet2::schema::types::{ + FieldInfo, GroupConvertedType, GroupLogicalType, IntegerType, ParquetType, PhysicalType, + PrimitiveConvertedType, PrimitiveLogicalType, PrimitiveType, TimeUnit as ParquetTimeUnit, +}; +use parquet2::schema::Repetition; + +use crate::datatypes::{DataType, Field, IntervalUnit, TimeUnit}; +use crate::io::parquet::read::schema::SchemaInferenceOptions; + +/// Converts [`ParquetType`]s to a [`Field`], ignoring parquet fields that do not contain +/// any physical column. +pub fn parquet_to_arrow_schema(fields: &[ParquetType]) -> Vec { + parquet_to_arrow_schema_with_options(fields, &None) +} + +/// Like [`parquet_to_arrow_schema`] but with configurable options which affect the behavior of schema inference +pub fn parquet_to_arrow_schema_with_options( + fields: &[ParquetType], + options: &Option, +) -> Vec { + fields + .iter() + .filter_map(|f| to_field(f, options.as_ref().unwrap_or(&Default::default()))) + .collect::>() +} + +fn from_int32( + logical_type: Option, + converted_type: Option, +) -> DataType { + use PrimitiveLogicalType::*; + match (logical_type, converted_type) { + // handle logical types first + (Some(Integer(t)), _) => match t { + IntegerType::Int8 => DataType::Int8, + IntegerType::Int16 => DataType::Int16, + IntegerType::Int32 => DataType::Int32, + IntegerType::UInt8 => DataType::UInt8, + IntegerType::UInt16 => DataType::UInt16, + IntegerType::UInt32 => DataType::UInt32, + // The above are the only possible annotations for parquet's int32. Anything else + // is a deviation to the parquet specification and we ignore + _ => DataType::Int32, + }, + (Some(Decimal(precision, scale)), _) => DataType::Decimal(precision, scale), + (Some(Date), _) => DataType::Date32, + (Some(Time { unit, .. }), _) => match unit { + ParquetTimeUnit::Milliseconds => DataType::Time32(TimeUnit::Millisecond), + // MILLIS is the only possible annotation for parquet's int32. 
Anything else + // is a deviation to the parquet specification and we ignore + _ => DataType::Int32, + }, + // handle converted types: + (_, Some(PrimitiveConvertedType::Uint8)) => DataType::UInt8, + (_, Some(PrimitiveConvertedType::Uint16)) => DataType::UInt16, + (_, Some(PrimitiveConvertedType::Uint32)) => DataType::UInt32, + (_, Some(PrimitiveConvertedType::Int8)) => DataType::Int8, + (_, Some(PrimitiveConvertedType::Int16)) => DataType::Int16, + (_, Some(PrimitiveConvertedType::Int32)) => DataType::Int32, + (_, Some(PrimitiveConvertedType::Date)) => DataType::Date32, + (_, Some(PrimitiveConvertedType::TimeMillis)) => DataType::Time32(TimeUnit::Millisecond), + (_, Some(PrimitiveConvertedType::Decimal(precision, scale))) => { + DataType::Decimal(precision, scale) + }, + (_, _) => DataType::Int32, + } +} + +fn from_int64( + logical_type: Option, + converted_type: Option, +) -> DataType { + use PrimitiveLogicalType::*; + match (logical_type, converted_type) { + // handle logical types first + (Some(Integer(integer)), _) => match integer { + IntegerType::UInt64 => DataType::UInt64, + IntegerType::Int64 => DataType::Int64, + _ => DataType::Int64, + }, + ( + Some(Timestamp { + is_adjusted_to_utc, + unit, + }), + _, + ) => { + let timezone = if is_adjusted_to_utc { + // https://github.com/apache/parquet-format/blob/master/LogicalTypes.md + // A TIMESTAMP with isAdjustedToUTC=true is defined as [...] elapsed since the Unix epoch + Some("+00:00".to_string()) + } else { + // PARQUET: + // https://github.com/apache/parquet-format/blob/master/LogicalTypes.md + // A TIMESTAMP with isAdjustedToUTC=false represents [...] such + // timestamps should always be displayed the same way, regardless of the local time zone in effect + // ARROW: + // https://github.com/apache/parquet-format/blob/master/LogicalTypes.md + // If the time zone is null or equal to an empty string, the data is "time + // zone naive" and shall be displayed *as is* to the user, not localized + // to the locale of the user. + None + }; + + match unit { + ParquetTimeUnit::Milliseconds => { + DataType::Timestamp(TimeUnit::Millisecond, timezone) + }, + ParquetTimeUnit::Microseconds => { + DataType::Timestamp(TimeUnit::Microsecond, timezone) + }, + ParquetTimeUnit::Nanoseconds => DataType::Timestamp(TimeUnit::Nanosecond, timezone), + } + }, + (Some(Time { unit, .. }), _) => match unit { + ParquetTimeUnit::Microseconds => DataType::Time64(TimeUnit::Microsecond), + ParquetTimeUnit::Nanoseconds => DataType::Time64(TimeUnit::Nanosecond), + // MILLIS is only possible for int32. 
Appearing in int64 is a deviation + // to parquet's spec, which we ignore + _ => DataType::Int64, + }, + (Some(Decimal(precision, scale)), _) => DataType::Decimal(precision, scale), + // handle converted types: + (_, Some(PrimitiveConvertedType::TimeMicros)) => DataType::Time64(TimeUnit::Microsecond), + (_, Some(PrimitiveConvertedType::TimestampMillis)) => { + DataType::Timestamp(TimeUnit::Millisecond, None) + }, + (_, Some(PrimitiveConvertedType::TimestampMicros)) => { + DataType::Timestamp(TimeUnit::Microsecond, None) + }, + (_, Some(PrimitiveConvertedType::Int64)) => DataType::Int64, + (_, Some(PrimitiveConvertedType::Uint64)) => DataType::UInt64, + (_, Some(PrimitiveConvertedType::Decimal(precision, scale))) => { + DataType::Decimal(precision, scale) + }, + + (_, _) => DataType::Int64, + } +} + +fn from_byte_array( + logical_type: &Option, + converted_type: &Option, +) -> DataType { + match (logical_type, converted_type) { + (Some(PrimitiveLogicalType::String), _) => DataType::Utf8, + (Some(PrimitiveLogicalType::Json), _) => DataType::Binary, + (Some(PrimitiveLogicalType::Bson), _) => DataType::Binary, + (Some(PrimitiveLogicalType::Enum), _) => DataType::Binary, + (_, Some(PrimitiveConvertedType::Json)) => DataType::Binary, + (_, Some(PrimitiveConvertedType::Bson)) => DataType::Binary, + (_, Some(PrimitiveConvertedType::Enum)) => DataType::Binary, + (_, Some(PrimitiveConvertedType::Utf8)) => DataType::Utf8, + (_, _) => DataType::Binary, + } +} + +fn from_fixed_len_byte_array( + length: usize, + logical_type: Option, + converted_type: Option, +) -> DataType { + match (logical_type, converted_type) { + (Some(PrimitiveLogicalType::Decimal(precision, scale)), _) => { + DataType::Decimal(precision, scale) + }, + (None, Some(PrimitiveConvertedType::Decimal(precision, scale))) => { + DataType::Decimal(precision, scale) + }, + (None, Some(PrimitiveConvertedType::Interval)) => { + // There is currently no reliable way of determining which IntervalUnit + // to return. Thus without the original Arrow schema, the results + // would be incorrect if all 12 bytes of the interval are populated + DataType::Interval(IntervalUnit::DayTime) + }, + _ => DataType::FixedSizeBinary(length), + } +} + +/// Maps a [`PhysicalType`] with optional metadata to a [`DataType`] +fn to_primitive_type_inner( + primitive_type: &PrimitiveType, + options: &SchemaInferenceOptions, +) -> DataType { + match primitive_type.physical_type { + PhysicalType::Boolean => DataType::Boolean, + PhysicalType::Int32 => { + from_int32(primitive_type.logical_type, primitive_type.converted_type) + }, + PhysicalType::Int64 => { + from_int64(primitive_type.logical_type, primitive_type.converted_type) + }, + PhysicalType::Int96 => DataType::Timestamp(options.int96_coerce_to_timeunit, None), + PhysicalType::Float => DataType::Float32, + PhysicalType::Double => DataType::Float64, + PhysicalType::ByteArray => { + from_byte_array(&primitive_type.logical_type, &primitive_type.converted_type) + }, + PhysicalType::FixedLenByteArray(length) => from_fixed_len_byte_array( + length, + primitive_type.logical_type, + primitive_type.converted_type, + ), + } +} + +/// Entry point for converting parquet primitive type to arrow type. +/// +/// This function takes care of repetition. 
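A minimal illustrative sketch of the repetition handling described above (not part of the patch; the `nano_arrow` module paths are assumed, and the usage mirrors the tests further down in this file): a REPEATED primitive column is wrapped in a `DataType::List` whose child keeps the column's name and nullability.

use nano_arrow::datatypes::DataType;
use nano_arrow::io::parquet::read::schema::parquet_to_arrow_schema;
use parquet2::metadata::SchemaDescriptor;

fn repeated_int32_maps_to_list() -> Result<(), Box<dyn std::error::Error>> {
    // One-level list encoding: a repeated primitive without a LIST wrapper group.
    let schema = SchemaDescriptor::try_from_message("message s { REPEATED INT32 name; }")?;
    let fields = parquet_to_arrow_schema(schema.fields());
    // The repeated INT32 is inferred as a list; the child field keeps the name "name".
    assert!(matches!(fields[0].data_type(), DataType::List(_)));
    Ok(())
}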
+fn to_primitive_type(primitive_type: &PrimitiveType, options: &SchemaInferenceOptions) -> DataType { + let base_type = to_primitive_type_inner(primitive_type, options); + + if primitive_type.field_info.repetition == Repetition::Repeated { + DataType::List(Box::new(Field::new( + &primitive_type.field_info.name, + base_type, + is_nullable(&primitive_type.field_info), + ))) + } else { + base_type + } +} + +fn non_repeated_group( + logical_type: &Option, + converted_type: &Option, + fields: &[ParquetType], + parent_name: &str, + options: &SchemaInferenceOptions, +) -> Option { + debug_assert!(!fields.is_empty()); + match (logical_type, converted_type) { + (Some(GroupLogicalType::List), _) => to_list(fields, parent_name, options), + (None, Some(GroupConvertedType::List)) => to_list(fields, parent_name, options), + (Some(GroupLogicalType::Map), _) => to_list(fields, parent_name, options), + (None, Some(GroupConvertedType::Map) | Some(GroupConvertedType::MapKeyValue)) => { + to_map(fields, options) + }, + _ => to_struct(fields, options), + } +} + +/// Converts a parquet group type to an arrow [`DataType::Struct`]. +/// Returns [`None`] if all its fields are empty +fn to_struct(fields: &[ParquetType], options: &SchemaInferenceOptions) -> Option { + let fields = fields + .iter() + .filter_map(|f| to_field(f, options)) + .collect::>(); + if fields.is_empty() { + None + } else { + Some(DataType::Struct(fields)) + } +} + +/// Converts a parquet group type to an arrow [`DataType::Struct`]. +/// Returns [`None`] if all its fields are empty +fn to_map(fields: &[ParquetType], options: &SchemaInferenceOptions) -> Option { + let inner = to_field(&fields[0], options)?; + Some(DataType::Map(Box::new(inner), false)) +} + +/// Entry point for converting parquet group type. +/// +/// This function takes care of logical type and repetition. +fn to_group_type( + field_info: &FieldInfo, + logical_type: &Option, + converted_type: &Option, + fields: &[ParquetType], + parent_name: &str, + options: &SchemaInferenceOptions, +) -> Option { + debug_assert!(!fields.is_empty()); + if field_info.repetition == Repetition::Repeated { + Some(DataType::List(Box::new(Field::new( + &field_info.name, + to_struct(fields, options)?, + is_nullable(field_info), + )))) + } else { + non_repeated_group(logical_type, converted_type, fields, parent_name, options) + } +} + +/// Checks whether this schema is nullable. +pub(crate) fn is_nullable(field_info: &FieldInfo) -> bool { + match field_info.repetition { + Repetition::Optional => true, + Repetition::Repeated => true, + Repetition::Required => false, + } +} + +/// Converts parquet schema to arrow field. +/// Returns `None` iff the parquet type has no associated primitive types, +/// i.e. if it is a column-less group type. +fn to_field(type_: &ParquetType, options: &SchemaInferenceOptions) -> Option { + Some(Field::new( + &type_.get_field_info().name, + to_data_type(type_, options)?, + is_nullable(type_.get_field_info()), + )) +} + +/// Converts a parquet list to arrow list. +/// +/// To fully understand this algorithm, please refer to +/// [parquet doc](https://github.com/apache/parquet-format/blob/master/LogicalTypes.md). +fn to_list( + fields: &[ParquetType], + parent_name: &str, + options: &SchemaInferenceOptions, +) -> Option { + let item = fields.first().unwrap(); + + let item_type = match item { + ParquetType::PrimitiveType(primitive) => Some(to_primitive_type_inner(primitive, options)), + ParquetType::GroupType { fields, .. 
} => { + if fields.len() == 1 + && item.name() != "array" + && item.name() != format!("{parent_name}_tuple") + { + // extract the repetition field + let nested_item = fields.first().unwrap(); + to_data_type(nested_item, options) + } else { + to_struct(fields, options) + } + }, + }?; + + // Check that the name of the list child is "list", in which case we + // get the child nullability and name (normally "element") from the nested + // group type. + // Without this step, the child incorrectly inherits the parent's optionality + let (list_item_name, item_is_optional) = match item { + ParquetType::GroupType { + field_info, fields, .. + } if field_info.name == "list" && fields.len() == 1 => { + let field = fields.first().unwrap(); + ( + &field.get_field_info().name, + field.get_field_info().repetition != Repetition::Required, + ) + }, + _ => ( + &item.get_field_info().name, + item.get_field_info().repetition != Repetition::Required, + ), + }; + + Some(DataType::List(Box::new(Field::new( + list_item_name, + item_type, + item_is_optional, + )))) +} + +/// Converts parquet schema to arrow data type. +/// +/// This function discards schema name. +/// +/// If this schema is a primitive type and not included in the leaves, the result is +/// Ok(None). +/// +/// If this schema is a group type and none of its children is reserved in the +/// conversion, the result is Ok(None). +pub(crate) fn to_data_type( + type_: &ParquetType, + options: &SchemaInferenceOptions, +) -> Option { + match type_ { + ParquetType::PrimitiveType(primitive) => Some(to_primitive_type(primitive, options)), + ParquetType::GroupType { + field_info, + logical_type, + converted_type, + fields, + } => { + if fields.is_empty() { + None + } else { + to_group_type( + field_info, + logical_type, + converted_type, + fields, + &field_info.name, + options, + ) + } + }, + } +} + +#[cfg(test)] +mod tests { + use parquet2::metadata::SchemaDescriptor; + + use super::*; + use crate::datatypes::{DataType, Field, TimeUnit}; + use crate::error::Result; + + #[test] + fn test_flat_primitives() -> Result<()> { + let message = " + message test_schema { + REQUIRED BOOLEAN boolean; + REQUIRED INT32 int8 (INT_8); + REQUIRED INT32 int16 (INT_16); + REQUIRED INT32 uint8 (INTEGER(8,false)); + REQUIRED INT32 uint16 (INTEGER(16,false)); + REQUIRED INT32 int32; + REQUIRED INT64 int64 ; + OPTIONAL DOUBLE double; + OPTIONAL FLOAT float; + OPTIONAL BINARY string (UTF8); + OPTIONAL BINARY string_2 (STRING); + } + "; + let expected = &[ + Field::new("boolean", DataType::Boolean, false), + Field::new("int8", DataType::Int8, false), + Field::new("int16", DataType::Int16, false), + Field::new("uint8", DataType::UInt8, false), + Field::new("uint16", DataType::UInt16, false), + Field::new("int32", DataType::Int32, false), + Field::new("int64", DataType::Int64, false), + Field::new("double", DataType::Float64, true), + Field::new("float", DataType::Float32, true), + Field::new("string", DataType::Utf8, true), + Field::new("string_2", DataType::Utf8, true), + ]; + + let parquet_schema = SchemaDescriptor::try_from_message(message)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(fields, expected); + Ok(()) + } + + #[test] + fn test_byte_array_fields() -> Result<()> { + let message = " + message test_schema { + REQUIRED BYTE_ARRAY binary; + REQUIRED FIXED_LEN_BYTE_ARRAY (20) fixed_binary; + } + "; + let expected = vec![ + Field::new("binary", DataType::Binary, false), + Field::new("fixed_binary", DataType::FixedSizeBinary(20), false), + ]; + 
+ let parquet_schema = SchemaDescriptor::try_from_message(message)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(fields, expected); + Ok(()) + } + + #[test] + fn test_duplicate_fields() -> Result<()> { + let message = " + message test_schema { + REQUIRED BOOLEAN boolean; + REQUIRED INT32 int8 (INT_8); + } + "; + let expected = &[ + Field::new("boolean", DataType::Boolean, false), + Field::new("int8", DataType::Int8, false), + ]; + + let parquet_schema = SchemaDescriptor::try_from_message(message)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(fields, expected); + Ok(()) + } + + #[test] + fn test_parquet_lists() -> Result<()> { + let mut arrow_fields = Vec::new(); + + // LIST encoding example taken from parquet-format/LogicalTypes.md + let message_type = " + message test_schema { + REQUIRED GROUP my_list (LIST) { + REPEATED GROUP list { + OPTIONAL BINARY element (UTF8); + } + } + OPTIONAL GROUP my_list (LIST) { + REPEATED GROUP list { + REQUIRED BINARY element (UTF8); + } + } + OPTIONAL GROUP array_of_arrays (LIST) { + REPEATED GROUP list { + REQUIRED GROUP element (LIST) { + REPEATED GROUP list { + REQUIRED INT32 element; + } + } + } + } + OPTIONAL GROUP my_list (LIST) { + REPEATED GROUP element { + REQUIRED BINARY str (UTF8); + } + } + OPTIONAL GROUP my_list (LIST) { + REPEATED INT32 element; + } + OPTIONAL GROUP my_list (LIST) { + REPEATED GROUP element { + REQUIRED BINARY str (UTF8); + REQUIRED INT32 num; + } + } + OPTIONAL GROUP my_list (LIST) { + REPEATED GROUP array { + REQUIRED BINARY str (UTF8); + } + + } + OPTIONAL GROUP my_list (LIST) { + REPEATED GROUP my_list_tuple { + REQUIRED BINARY str (UTF8); + } + } + REPEATED INT32 name; + } + "; + + // // List (list non-null, elements nullable) + // required group my_list (LIST) { + // repeated group list { + // optional binary element (UTF8); + // } + // } + { + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("element", DataType::Utf8, true))), + false, + )); + } + + // // List (list nullable, elements non-null) + // optional group my_list (LIST) { + // repeated group list { + // required binary element (UTF8); + // } + // } + { + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("element", DataType::Utf8, false))), + true, + )); + } + + // Element types can be nested structures. 
For example, a list of lists: + // + // // List> + // optional group array_of_arrays (LIST) { + // repeated group list { + // required group element (LIST) { + // repeated group list { + // required int32 element; + // } + // } + // } + // } + { + let arrow_inner_list = + DataType::List(Box::new(Field::new("element", DataType::Int32, false))); + arrow_fields.push(Field::new( + "array_of_arrays", + DataType::List(Box::new(Field::new("element", arrow_inner_list, false))), + true, + )); + } + + // // List (list nullable, elements non-null) + // optional group my_list (LIST) { + // repeated group element { + // required binary str (UTF8); + // }; + // } + { + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("element", DataType::Utf8, true))), + true, + )); + } + + // // List (nullable list, non-null elements) + // optional group my_list (LIST) { + // repeated int32 element; + // } + { + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("element", DataType::Int32, true))), + true, + )); + } + + // // List> (nullable list, non-null elements) + // optional group my_list (LIST) { + // repeated group element { + // required binary str (UTF8); + // required int32 num; + // }; + // } + { + let arrow_struct = DataType::Struct(vec![ + Field::new("str", DataType::Utf8, false), + Field::new("num", DataType::Int32, false), + ]); + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("element", arrow_struct, true))), + true, + )); + } + + // // List> (nullable list, non-null elements) + // optional group my_list (LIST) { + // repeated group array { + // required binary str (UTF8); + // }; + // } + // Special case: group is named array + { + let arrow_struct = DataType::Struct(vec![Field::new("str", DataType::Utf8, false)]); + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("array", arrow_struct, true))), + true, + )); + } + + // // List> (nullable list, non-null elements) + // optional group my_list (LIST) { + // repeated group my_list_tuple { + // required binary str (UTF8); + // }; + // } + // Special case: group named ends in _tuple + { + let arrow_struct = DataType::Struct(vec![Field::new("str", DataType::Utf8, false)]); + arrow_fields.push(Field::new( + "my_list", + DataType::List(Box::new(Field::new("my_list_tuple", arrow_struct, true))), + true, + )); + } + + // One-level encoding: Only allows required lists with required cells + // repeated value_type name + { + arrow_fields.push(Field::new( + "name", + DataType::List(Box::new(Field::new("name", DataType::Int32, true))), + true, + )); + } + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_parquet_list_nullable() -> Result<()> { + let mut arrow_fields = Vec::new(); + + let message_type = " + message test_schema { + REQUIRED GROUP my_list1 (LIST) { + REPEATED GROUP list { + OPTIONAL BINARY element (UTF8); + } + } + OPTIONAL GROUP my_list2 (LIST) { + REPEATED GROUP list { + REQUIRED BINARY element (UTF8); + } + } + REQUIRED GROUP my_list3 (LIST) { + REPEATED GROUP list { + REQUIRED BINARY element (UTF8); + } + } + } + "; + + // // List (list non-null, elements nullable) + // required group my_list1 (LIST) { + // repeated group list { + // optional binary element (UTF8); + // } + // } + { + arrow_fields.push(Field::new( + "my_list1", + 
DataType::List(Box::new(Field::new("element", DataType::Utf8, true))), + false, + )); + } + + // // List (list nullable, elements non-null) + // optional group my_list2 (LIST) { + // repeated group list { + // required binary element (UTF8); + // } + // } + { + arrow_fields.push(Field::new( + "my_list2", + DataType::List(Box::new(Field::new("element", DataType::Utf8, false))), + true, + )); + } + + // // List (list non-null, elements non-null) + // repeated group my_list3 (LIST) { + // repeated group list { + // required binary element (UTF8); + // } + // } + { + arrow_fields.push(Field::new( + "my_list3", + DataType::List(Box::new(Field::new("element", DataType::Utf8, false))), + false, + )); + } + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_nested_schema() -> Result<()> { + let mut arrow_fields = Vec::new(); + { + let group1_fields = vec![ + Field::new("leaf1", DataType::Boolean, false), + Field::new("leaf2", DataType::Int32, false), + ]; + let group1_struct = Field::new("group1", DataType::Struct(group1_fields), false); + arrow_fields.push(group1_struct); + + let leaf3_field = Field::new("leaf3", DataType::Int64, false); + arrow_fields.push(leaf3_field); + } + + let message_type = " + message test_schema { + REQUIRED GROUP group1 { + REQUIRED BOOLEAN leaf1; + REQUIRED INT32 leaf2; + } + REQUIRED INT64 leaf3; + } + "; + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_repeated_nested_schema() -> Result<()> { + let mut arrow_fields = Vec::new(); + { + arrow_fields.push(Field::new("leaf1", DataType::Int32, true)); + + let inner_group_list = Field::new( + "innerGroup", + DataType::List(Box::new(Field::new( + "innerGroup", + DataType::Struct(vec![Field::new("leaf3", DataType::Int32, true)]), + true, + ))), + true, + ); + + let outer_group_list = Field::new( + "outerGroup", + DataType::List(Box::new(Field::new( + "outerGroup", + DataType::Struct(vec![ + Field::new("leaf2", DataType::Int32, true), + inner_group_list, + ]), + true, + ))), + true, + ); + arrow_fields.push(outer_group_list); + } + + let message_type = " + message test_schema { + OPTIONAL INT32 leaf1; + REPEATED GROUP outerGroup { + OPTIONAL INT32 leaf2; + REPEATED GROUP innerGroup { + OPTIONAL INT32 leaf3; + } + } + } + "; + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_column_desc_to_field() -> Result<()> { + let message_type = " + message test_schema { + REQUIRED BOOLEAN boolean; + REQUIRED INT32 int8 (INT_8); + REQUIRED INT32 uint8 (INTEGER(8,false)); + REQUIRED INT32 int16 (INT_16); + REQUIRED INT32 uint16 (INTEGER(16,false)); + REQUIRED INT32 int32; + REQUIRED INT64 int64; + OPTIONAL DOUBLE double; + OPTIONAL FLOAT float; + OPTIONAL BINARY string (UTF8); + REPEATED BOOLEAN bools; + OPTIONAL INT32 date (DATE); + OPTIONAL INT32 time_milli (TIME_MILLIS); + OPTIONAL INT64 time_micro (TIME_MICROS); + OPTIONAL INT64 time_nano (TIME(NANOS,false)); + OPTIONAL INT64 ts_milli (TIMESTAMP_MILLIS); + REQUIRED INT64 ts_micro (TIMESTAMP_MICROS); + REQUIRED INT64 ts_nano (TIMESTAMP(NANOS,true)); + } + "; + let arrow_fields = vec![ + 
Field::new("boolean", DataType::Boolean, false), + Field::new("int8", DataType::Int8, false), + Field::new("uint8", DataType::UInt8, false), + Field::new("int16", DataType::Int16, false), + Field::new("uint16", DataType::UInt16, false), + Field::new("int32", DataType::Int32, false), + Field::new("int64", DataType::Int64, false), + Field::new("double", DataType::Float64, true), + Field::new("float", DataType::Float32, true), + Field::new("string", DataType::Utf8, true), + Field::new( + "bools", + DataType::List(Box::new(Field::new("bools", DataType::Boolean, true))), + true, + ), + Field::new("date", DataType::Date32, true), + Field::new("time_milli", DataType::Time32(TimeUnit::Millisecond), true), + Field::new("time_micro", DataType::Time64(TimeUnit::Microsecond), true), + Field::new("time_nano", DataType::Time64(TimeUnit::Nanosecond), true), + Field::new( + "ts_milli", + DataType::Timestamp(TimeUnit::Millisecond, None), + true, + ), + Field::new( + "ts_micro", + DataType::Timestamp(TimeUnit::Microsecond, None), + false, + ), + Field::new( + "ts_nano", + DataType::Timestamp(TimeUnit::Nanosecond, Some("+00:00".to_string())), + false, + ), + ]; + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_field_to_column_desc() -> Result<()> { + let message_type = " + message arrow_schema { + REQUIRED BOOLEAN boolean; + REQUIRED INT32 int8 (INT_8); + REQUIRED INT32 int16 (INTEGER(16,true)); + REQUIRED INT32 int32; + REQUIRED INT64 int64; + OPTIONAL DOUBLE double; + OPTIONAL FLOAT float; + OPTIONAL BINARY string (STRING); + OPTIONAL GROUP bools (LIST) { + REPEATED GROUP list { + OPTIONAL BOOLEAN element; + } + } + REQUIRED GROUP bools_non_null (LIST) { + REPEATED GROUP list { + REQUIRED BOOLEAN element; + } + } + OPTIONAL INT32 date (DATE); + OPTIONAL INT32 time_milli (TIME(MILLIS,false)); + OPTIONAL INT64 time_micro (TIME_MICROS); + OPTIONAL INT64 ts_milli (TIMESTAMP_MILLIS); + REQUIRED INT64 ts_micro (TIMESTAMP(MICROS,false)); + REQUIRED GROUP struct { + REQUIRED BOOLEAN bools; + REQUIRED INT32 uint32 (INTEGER(32,false)); + REQUIRED GROUP int32 (LIST) { + REPEATED GROUP list { + OPTIONAL INT32 element; + } + } + } + REQUIRED BINARY dictionary_strings (STRING); + } + "; + + let arrow_fields = vec![ + Field::new("boolean", DataType::Boolean, false), + Field::new("int8", DataType::Int8, false), + Field::new("int16", DataType::Int16, false), + Field::new("int32", DataType::Int32, false), + Field::new("int64", DataType::Int64, false), + Field::new("double", DataType::Float64, true), + Field::new("float", DataType::Float32, true), + Field::new("string", DataType::Utf8, true), + Field::new( + "bools", + DataType::List(Box::new(Field::new("element", DataType::Boolean, true))), + true, + ), + Field::new( + "bools_non_null", + DataType::List(Box::new(Field::new("element", DataType::Boolean, false))), + false, + ), + Field::new("date", DataType::Date32, true), + Field::new("time_milli", DataType::Time32(TimeUnit::Millisecond), true), + Field::new("time_micro", DataType::Time64(TimeUnit::Microsecond), true), + Field::new( + "ts_milli", + DataType::Timestamp(TimeUnit::Millisecond, None), + true, + ), + Field::new( + "ts_micro", + DataType::Timestamp(TimeUnit::Microsecond, None), + false, + ), + Field::new( + "struct", + DataType::Struct(vec![ + Field::new("bools", DataType::Boolean, false), + Field::new("uint32", DataType::UInt32, false), + Field::new( + 
"int32", + DataType::List(Box::new(Field::new("element", DataType::Int32, true))), + false, + ), + ]), + false, + ), + Field::new("dictionary_strings", DataType::Utf8, false), + ]; + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema(parquet_schema.fields()); + + assert_eq!(arrow_fields, fields); + Ok(()) + } + + #[test] + fn test_int96_options() -> Result<()> { + for tu in [ + TimeUnit::Second, + TimeUnit::Microsecond, + TimeUnit::Millisecond, + TimeUnit::Nanosecond, + ] { + let message_type = " + message arrow_schema { + REQUIRED INT96 int96_field; + OPTIONAL GROUP int96_list (LIST) { + REPEATED GROUP list { + OPTIONAL INT96 element; + } + } + REQUIRED GROUP int96_struct { + REQUIRED INT96 int96_field; + } + } + "; + let coerced_to = DataType::Timestamp(tu, None); + let arrow_fields = vec![ + Field::new("int96_field", coerced_to.clone(), false), + Field::new( + "int96_list", + DataType::List(Box::new(Field::new("element", coerced_to.clone(), true))), + true, + ), + Field::new( + "int96_struct", + DataType::Struct(vec![Field::new("int96_field", coerced_to.clone(), false)]), + false, + ), + ]; + + let parquet_schema = SchemaDescriptor::try_from_message(message_type)?; + let fields = parquet_to_arrow_schema_with_options( + parquet_schema.fields(), + &Some(SchemaInferenceOptions { + int96_coerce_to_timeunit: tu, + }), + ); + assert_eq!(arrow_fields, fields); + } + Ok(()) + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/schema/metadata.rs b/crates/nano-arrow/src/io/parquet/read/schema/metadata.rs new file mode 100644 index 000000000000..574ff08d1fd5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/schema/metadata.rs @@ -0,0 +1,55 @@ +use base64::engine::general_purpose; +use base64::Engine as _; +pub use parquet2::metadata::KeyValue; + +use super::super::super::ARROW_SCHEMA_META_KEY; +use crate::datatypes::{Metadata, Schema}; +use crate::error::{Error, Result}; +use crate::io::ipc::read::deserialize_schema; + +/// Reads an arrow schema from Parquet's file metadata. Returns `None` if no schema was found. +/// # Errors +/// Errors iff the schema cannot be correctly parsed. +pub fn read_schema_from_metadata(metadata: &mut Metadata) -> Result> { + metadata + .remove(ARROW_SCHEMA_META_KEY) + .map(|encoded| get_arrow_schema_from_metadata(&encoded)) + .transpose() +} + +/// Try to convert Arrow schema metadata into a schema +fn get_arrow_schema_from_metadata(encoded_meta: &str) -> Result { + let decoded = general_purpose::STANDARD.decode(encoded_meta); + match decoded { + Ok(bytes) => { + let slice = if bytes[0..4] == [255u8; 4] { + &bytes[8..] + } else { + bytes.as_slice() + }; + deserialize_schema(slice).map(|x| x.0) + }, + Err(err) => { + // The C++ implementation returns an error if the schema can't be parsed. + Err(Error::InvalidArgumentError(format!( + "Unable to decode the encoded schema stored in {ARROW_SCHEMA_META_KEY}, {err:?}" + ))) + }, + } +} + +pub(super) fn parse_key_value_metadata(key_value_metadata: &Option>) -> Metadata { + key_value_metadata + .as_ref() + .map(|key_values| { + key_values + .iter() + .filter_map(|kv| { + kv.value + .as_ref() + .map(|value| (kv.key.clone(), value.clone())) + }) + .collect() + }) + .unwrap_or_default() +} diff --git a/crates/nano-arrow/src/io/parquet/read/schema/mod.rs b/crates/nano-arrow/src/io/parquet/read/schema/mod.rs new file mode 100644 index 000000000000..8b2394684440 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/schema/mod.rs @@ -0,0 +1,58 @@ +//! 
APIs to handle Parquet <-> Arrow schemas.
+use crate::datatypes::{Schema, TimeUnit};
+use crate::error::Result;
+
+mod convert;
+mod metadata;
+
+pub(crate) use convert::*;
+pub use convert::{parquet_to_arrow_schema, parquet_to_arrow_schema_with_options};
+pub use metadata::read_schema_from_metadata;
+pub use parquet2::metadata::{FileMetaData, KeyValue, SchemaDescriptor};
+pub use parquet2::schema::types::ParquetType;
+
+use self::metadata::parse_key_value_metadata;
+
+/// Options when inferring schemas from Parquet
+pub struct SchemaInferenceOptions {
+    /// When inferring schemas from the Parquet INT96 timestamp type, this is the corresponding TimeUnit
+    /// in the inferred Arrow Timestamp type.
+    ///
+    /// This defaults to `TimeUnit::Nanosecond`, but INT96 timestamps outside the range of years 1678-2262
+    /// will overflow when parsed as `Timestamp(TimeUnit::Nanosecond)`. Setting this to a lower resolution
+    /// (e.g. TimeUnit::Milliseconds) will result in loss of precision, but support a larger range of dates
+    /// without overflowing when parsing the data.
+    pub int96_coerce_to_timeunit: TimeUnit,
+}
+
+impl Default for SchemaInferenceOptions {
+    fn default() -> Self {
+        SchemaInferenceOptions {
+            int96_coerce_to_timeunit: TimeUnit::Nanosecond,
+        }
+    }
+}
+
+/// Infers a [`Schema`] from parquet's [`FileMetaData`]. This first looks for the metadata key
+/// `"ARROW:schema"`; if it does not exist, it converts the parquet types declared in the
+/// file's parquet schema to Arrow's equivalent.
+/// # Error
+/// This function errors iff the key `"ARROW:schema"` exists but is not correctly encoded,
+/// indicating that the file's arrow metadata was incorrectly written.
+pub fn infer_schema(file_metadata: &FileMetaData) -> Result<Schema> {
+    infer_schema_with_options(file_metadata, &None)
+}
+
+/// Like [`infer_schema`] but with configurable options which affect the behavior of inference
+pub fn infer_schema_with_options(
+    file_metadata: &FileMetaData,
+    options: &Option<SchemaInferenceOptions>,
+) -> Result<Schema> {
+    let mut metadata = parse_key_value_metadata(file_metadata.key_value_metadata());
+
+    let schema = read_schema_from_metadata(&mut metadata)?;
+    Ok(schema.unwrap_or_else(|| {
+        let fields = parquet_to_arrow_schema_with_options(file_metadata.schema().fields(), options);
+        Schema { fields, metadata }
+    }))
+}
diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/binary.rs b/crates/nano-arrow/src/io/parquet/read/statistics/binary.rs
new file mode 100644
index 000000000000..aeb43a6b3e0b
--- /dev/null
+++ b/crates/nano-arrow/src/io/parquet/read/statistics/binary.rs
@@ -0,0 +1,24 @@
+use parquet2::statistics::{BinaryStatistics, Statistics as ParquetStatistics};
+
+use crate::array::{MutableArray, MutableBinaryArray};
+use crate::error::Result;
+use crate::offset::Offset;
+
+pub(super) fn push<O: Offset>(
+    from: Option<&dyn ParquetStatistics>,
+    min: &mut dyn MutableArray,
+    max: &mut dyn MutableArray,
+) -> Result<()> {
+    let min = min
+        .as_mut_any()
+        .downcast_mut::<MutableBinaryArray<O>>()
+        .unwrap();
+    let max = max
+        .as_mut_any()
+        .downcast_mut::<MutableBinaryArray<O>>()
+        .unwrap();
+    let from = from.map(|s| s.as_any().downcast_ref::<BinaryStatistics>().unwrap());
+    min.push(from.and_then(|s| s.min_value.as_ref()));
+    max.push(from.and_then(|s| s.max_value.as_ref()));
+    Ok(())
+}
diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/boolean.rs b/crates/nano-arrow/src/io/parquet/read/statistics/boolean.rs
new file mode 100644
index 000000000000..ebb0ce3dade2
--- /dev/null
+++ b/crates/nano-arrow/src/io/parquet/read/statistics/boolean.rs
@@ -0,0 +1,23 @@
+use
parquet2::statistics::{BooleanStatistics, Statistics as ParquetStatistics}; + +use crate::array::{MutableArray, MutableBooleanArray}; +use crate::error::Result; + +pub(super) fn push( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + min.push(from.and_then(|s| s.min_value)); + max.push(from.and_then(|s| s.max_value)); + Ok(()) +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/dictionary.rs b/crates/nano-arrow/src/io/parquet/read/statistics/dictionary.rs new file mode 100644 index 000000000000..f6e2fdddcce9 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/dictionary.rs @@ -0,0 +1,69 @@ +use super::make_mutable; +use crate::array::*; +use crate::datatypes::{DataType, PhysicalType}; +use crate::error::Result; + +#[derive(Debug)] +pub struct DynMutableDictionary { + data_type: DataType, + pub inner: Box, +} + +impl DynMutableDictionary { + pub fn try_with_capacity(data_type: DataType, capacity: usize) -> Result { + let inner = if let DataType::Dictionary(_, inner, _) = &data_type { + inner.as_ref() + } else { + unreachable!() + }; + let inner = make_mutable(inner, capacity)?; + + Ok(Self { data_type, inner }) + } +} + +impl MutableArray for DynMutableDictionary { + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn len(&self) -> usize { + self.inner.len() + } + + fn validity(&self) -> Option<&crate::bitmap::MutableBitmap> { + self.inner.validity() + } + + fn as_box(&mut self) -> Box { + let inner = self.inner.as_box(); + match self.data_type.to_physical_type() { + PhysicalType::Dictionary(key) => match_integer_type!(key, |$T| { + let keys: Vec<$T> = (0..inner.len() as $T).collect(); + let keys = PrimitiveArray::<$T>::from_vec(keys); + Box::new(DictionaryArray::<$T>::try_new(self.data_type.clone(), keys, inner).unwrap()) + }), + _ => todo!(), + } + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + todo!() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/fixlen.rs b/crates/nano-arrow/src/io/parquet/read/statistics/fixlen.rs new file mode 100644 index 000000000000..1f9db20d9c9a --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/fixlen.rs @@ -0,0 +1,146 @@ +use ethnum::I256; +use parquet2::statistics::{FixedLenStatistics, Statistics as ParquetStatistics}; + +use super::super::{convert_days_ms, convert_i128}; +use crate::array::*; +use crate::error::Result; +use crate::io::parquet::read::convert_i256; +use crate::types::{days_ms, i256}; + +pub(super) fn push_i128( + from: Option<&dyn ParquetStatistics>, + n: usize, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push(from.and_then(|s| s.min_value.as_deref().map(|x| convert_i128(x, n)))); + max.push(from.and_then(|s| s.max_value.as_deref().map(|x| convert_i128(x, n)))); + + Ok(()) +} + +pub(super) fn push_i256_with_i128( + from: Option<&dyn ParquetStatistics>, + n: 
usize, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push(from.and_then(|s| { + s.min_value + .as_deref() + .map(|x| i256(I256::new(convert_i128(x, n)))) + })); + max.push(from.and_then(|s| { + s.max_value + .as_deref() + .map(|x| i256(I256::new(convert_i128(x, n)))) + })); + + Ok(()) +} + +pub(super) fn push_i256( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push(from.and_then(|s| s.min_value.as_deref().map(convert_i256))); + max.push(from.and_then(|s| s.max_value.as_deref().map(convert_i256))); + + Ok(()) +} + +pub(super) fn push( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + min.push(from.and_then(|s| s.min_value.as_ref())); + max.push(from.and_then(|s| s.max_value.as_ref())); + Ok(()) +} + +fn convert_year_month(value: &[u8]) -> i32 { + i32::from_le_bytes(value[..4].try_into().unwrap()) +} + +pub(super) fn push_year_month( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push(from.and_then(|s| s.min_value.as_deref().map(convert_year_month))); + max.push(from.and_then(|s| s.max_value.as_deref().map(convert_year_month))); + + Ok(()) +} + +pub(super) fn push_days_ms( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push(from.and_then(|s| s.min_value.as_deref().map(convert_days_ms))); + max.push(from.and_then(|s| s.max_value.as_deref().map(convert_days_ms))); + + Ok(()) +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/list.rs b/crates/nano-arrow/src/io/parquet/read/statistics/list.rs new file mode 100644 index 000000000000..cb22cbf7063a --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/list.rs @@ -0,0 +1,85 @@ +use super::make_mutable; +use crate::array::*; +use crate::datatypes::DataType; +use crate::error::Result; +use crate::offset::Offsets; + +#[derive(Debug)] +pub struct DynMutableListArray { + data_type: DataType, + pub inner: Box, +} + +impl DynMutableListArray { + pub fn try_with_capacity(data_type: DataType, capacity: usize) -> Result { + let inner = match data_type.to_logical_type() { + DataType::List(inner) | DataType::LargeList(inner) => inner.data_type(), + _ => unreachable!(), + }; + let inner = make_mutable(inner, capacity)?; + + Ok(Self { data_type, inner }) + } +} + +impl MutableArray for DynMutableListArray { + fn 
data_type(&self) -> &DataType { + &self.data_type + } + + fn len(&self) -> usize { + self.inner.len() + } + + fn validity(&self) -> Option<&crate::bitmap::MutableBitmap> { + self.inner.validity() + } + + fn as_box(&mut self) -> Box { + let inner = self.inner.as_box(); + + match self.data_type.to_logical_type() { + DataType::List(_) => { + let offsets = + Offsets::try_from_lengths(std::iter::repeat(1).take(inner.len())).unwrap(); + Box::new(ListArray::::new( + self.data_type.clone(), + offsets.into(), + inner, + None, + )) + }, + DataType::LargeList(_) => { + let offsets = + Offsets::try_from_lengths(std::iter::repeat(1).take(inner.len())).unwrap(); + Box::new(ListArray::::new( + self.data_type.clone(), + offsets.into(), + inner, + None, + )) + }, + _ => unreachable!(), + } + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + todo!() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/map.rs b/crates/nano-arrow/src/io/parquet/read/statistics/map.rs new file mode 100644 index 000000000000..d6b2a73388f5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/map.rs @@ -0,0 +1,65 @@ +use super::make_mutable; +use crate::array::{Array, MapArray, MutableArray}; +use crate::datatypes::DataType; +use crate::error::Error; + +#[derive(Debug)] +pub struct DynMutableMapArray { + data_type: DataType, + pub inner: Box, +} + +impl DynMutableMapArray { + pub fn try_with_capacity(data_type: DataType, capacity: usize) -> Result { + let inner = match data_type.to_logical_type() { + DataType::Map(inner, _) => inner, + _ => unreachable!(), + }; + let inner = make_mutable(inner.data_type(), capacity)?; + + Ok(Self { data_type, inner }) + } +} + +impl MutableArray for DynMutableMapArray { + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn len(&self) -> usize { + self.inner.len() + } + + fn validity(&self) -> Option<&crate::bitmap::MutableBitmap> { + None + } + + fn as_box(&mut self) -> Box { + Box::new(MapArray::new( + self.data_type.clone(), + vec![0, self.inner.len() as i32].try_into().unwrap(), + self.inner.as_box(), + None, + )) + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + todo!() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/mod.rs b/crates/nano-arrow/src/io/parquet/read/statistics/mod.rs new file mode 100644 index 000000000000..3048952530a6 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/mod.rs @@ -0,0 +1,577 @@ +//! APIs exposing `parquet2`'s statistics as arrow's statistics. 
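A hedged usage sketch for this statistics API (not part of the patch; the `nano_arrow` paths and the `parquet2::read::read_metadata` / `FileMetaData::row_groups` accessors are assumptions): infer the arrow schema from the file metadata, then deserialize one field's per-row-group statistics into arrow arrays.

use std::fs::File;

use nano_arrow::array::PrimitiveArray;
use nano_arrow::io::parquet::read::{infer_schema, statistics::deserialize};

fn print_min_of_first_field(path: &str) -> Result<(), Box<dyn std::error::Error>> {
    let mut reader = File::open(path)?;
    // parquet2 exposes the file-level metadata, including per-row-group column chunks.
    let metadata = parquet2::read::read_metadata(&mut reader)?;
    let schema = infer_schema(&metadata)?;

    // Deserialize the parquet statistics of one arrow field into arrow arrays.
    let stats = deserialize(&schema.fields[0], &metadata.row_groups)?;

    // For a non-nested Int64 field, min/max are primitive arrays (one entry per row group).
    if let Some(min) = stats.min_value.as_any().downcast_ref::<PrimitiveArray<i64>>() {
        println!("row-group minima: {min:?}");
    }
    Ok(())
}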
+use std::collections::VecDeque; +use std::sync::Arc; + +use ethnum::I256; +use parquet2::metadata::RowGroupMetaData; +use parquet2::schema::types::{ + PhysicalType as ParquetPhysicalType, PrimitiveType as ParquetPrimitiveType, +}; +use parquet2::statistics::{ + BinaryStatistics, BooleanStatistics, FixedLenStatistics, PrimitiveStatistics, + Statistics as ParquetStatistics, +}; +use parquet2::types::int96_to_i64_ns; + +use crate::array::*; +use crate::datatypes::{DataType, Field, IntervalUnit, PhysicalType}; +use crate::error::{Error, Result}; +use crate::types::i256; + +mod binary; +mod boolean; +mod dictionary; +mod fixlen; +mod list; +mod map; +mod null; +mod primitive; +mod struct_; +mod utf8; + +use self::list::DynMutableListArray; +use super::get_field_columns; + +/// Arrow-deserialized parquet Statistics of a file +#[derive(Debug, PartialEq)] +pub struct Statistics { + /// number of nulls. This is a [`UInt64Array`] for non-nested types + pub null_count: Box, + /// number of dictinct values. This is a [`UInt64Array`] for non-nested types + pub distinct_count: Box, + /// Minimum + pub min_value: Box, + /// Maximum + pub max_value: Box, +} + +/// Arrow-deserialized parquet Statistics of a file +#[derive(Debug)] +struct MutableStatistics { + /// number of nulls + pub null_count: Box, + /// number of dictinct values + pub distinct_count: Box, + /// Minimum + pub min_value: Box, + /// Maximum + pub max_value: Box, +} + +impl From for Statistics { + fn from(mut s: MutableStatistics) -> Self { + let null_count = if let PhysicalType::Struct = s.null_count.data_type().to_physical_type() { + s.null_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::Map = s.null_count.data_type().to_physical_type() { + s.null_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::List = s.null_count.data_type().to_physical_type() { + s.null_count + .as_box() + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::LargeList = s.null_count.data_type().to_physical_type() { + s.null_count + .as_box() + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + .boxed() + } else { + s.null_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + }; + let distinct_count = if let PhysicalType::Struct = + s.distinct_count.data_type().to_physical_type() + { + s.distinct_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::Map = s.distinct_count.data_type().to_physical_type() { + s.distinct_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::List = s.distinct_count.data_type().to_physical_type() { + s.distinct_count + .as_box() + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + .boxed() + } else if let PhysicalType::LargeList = s.distinct_count.data_type().to_physical_type() { + s.distinct_count + .as_box() + .as_any() + .downcast_ref::>() + .unwrap() + .clone() + .boxed() + } else { + s.distinct_count + .as_box() + .as_any() + .downcast_ref::() + .unwrap() + .clone() + .boxed() + }; + Self { + null_count, + distinct_count, + min_value: s.min_value.as_box(), + max_value: s.max_value.as_box(), + } + } +} + +fn make_mutable(data_type: &DataType, capacity: usize) -> Result> { + Ok(match data_type.to_physical_type() { + PhysicalType::Boolean => { + Box::new(MutableBooleanArray::with_capacity(capacity)) as Box + 
}, + PhysicalType::Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + Box::new(MutablePrimitiveArray::<$T>::with_capacity(capacity).to(data_type.clone())) + as Box + }), + PhysicalType::Binary => { + Box::new(MutableBinaryArray::::with_capacity(capacity)) as Box + }, + PhysicalType::LargeBinary => { + Box::new(MutableBinaryArray::::with_capacity(capacity)) as Box + }, + PhysicalType::Utf8 => { + Box::new(MutableUtf8Array::::with_capacity(capacity)) as Box + }, + PhysicalType::LargeUtf8 => { + Box::new(MutableUtf8Array::::with_capacity(capacity)) as Box + }, + PhysicalType::FixedSizeBinary => { + Box::new(MutableFixedSizeBinaryArray::try_new(data_type.clone(), vec![], None).unwrap()) + as _ + }, + PhysicalType::LargeList | PhysicalType::List => Box::new( + DynMutableListArray::try_with_capacity(data_type.clone(), capacity)?, + ) as Box, + PhysicalType::Dictionary(_) => Box::new( + dictionary::DynMutableDictionary::try_with_capacity(data_type.clone(), capacity)?, + ), + PhysicalType::Struct => Box::new(struct_::DynMutableStructArray::try_with_capacity( + data_type.clone(), + capacity, + )?), + PhysicalType::Map => Box::new(map::DynMutableMapArray::try_with_capacity( + data_type.clone(), + capacity, + )?), + PhysicalType::Null => { + Box::new(MutableNullArray::new(DataType::Null, 0)) as Box + }, + other => { + return Err(Error::NotYetImplemented(format!( + "Deserializing parquet stats from {other:?} is still not implemented" + ))) + }, + }) +} + +fn create_dt(data_type: &DataType) -> DataType { + if let DataType::Struct(fields) = data_type.to_logical_type() { + DataType::Struct( + fields + .iter() + .map(|f| Field::new(&f.name, create_dt(&f.data_type), f.is_nullable)) + .collect(), + ) + } else if let DataType::Map(f, ordered) = data_type.to_logical_type() { + DataType::Map( + Box::new(Field::new(&f.name, create_dt(&f.data_type), f.is_nullable)), + *ordered, + ) + } else if let DataType::List(f) = data_type.to_logical_type() { + DataType::List(Box::new(Field::new( + &f.name, + create_dt(&f.data_type), + f.is_nullable, + ))) + } else if let DataType::LargeList(f) = data_type.to_logical_type() { + DataType::LargeList(Box::new(Field::new( + &f.name, + create_dt(&f.data_type), + f.is_nullable, + ))) + } else { + DataType::UInt64 + } +} + +impl MutableStatistics { + fn try_new(field: &Field) -> Result { + let min_value = make_mutable(&field.data_type, 0)?; + let max_value = make_mutable(&field.data_type, 0)?; + + let dt = create_dt(&field.data_type); + Ok(Self { + null_count: make_mutable(&dt, 0)?, + distinct_count: make_mutable(&dt, 0)?, + min_value, + max_value, + }) + } +} + +fn push_others( + from: Option<&dyn ParquetStatistics>, + distinct_count: &mut UInt64Vec, + null_count: &mut UInt64Vec, +) { + let from = if let Some(from) = from { + from + } else { + distinct_count.push(None); + null_count.push(None); + return; + }; + let (distinct, null_count1) = match from.physical_type() { + ParquetPhysicalType::Boolean => { + let from = from.as_any().downcast_ref::().unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::Int32 => { + let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::Int64 => { + let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::Int96 => { + let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::Float => { + 
let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::Double => { + let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::ByteArray => { + let from = from.as_any().downcast_ref::().unwrap(); + (from.distinct_count, from.null_count) + }, + ParquetPhysicalType::FixedLenByteArray(_) => { + let from = from.as_any().downcast_ref::().unwrap(); + (from.distinct_count, from.null_count) + }, + }; + + distinct_count.push(distinct.map(|x| x as u64)); + null_count.push(null_count1.map(|x| x as u64)); +} + +fn push( + stats: &mut VecDeque<(Option>, ParquetPrimitiveType)>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, + distinct_count: &mut dyn MutableArray, + null_count: &mut dyn MutableArray, +) -> Result<()> { + match min.data_type().to_logical_type() { + List(_) | LargeList(_) => { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + let distinct_count = distinct_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + let null_count = null_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + return push( + stats, + min.inner.as_mut(), + max.inner.as_mut(), + distinct_count.inner.as_mut(), + null_count.inner.as_mut(), + ); + }, + Dictionary(_, _, _) => { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + return push( + stats, + min.inner.as_mut(), + max.inner.as_mut(), + distinct_count, + null_count, + ); + }, + Struct(_) => { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + let distinct_count = distinct_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + let null_count = null_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + return min + .inner + .iter_mut() + .zip(max.inner.iter_mut()) + .zip(distinct_count.inner.iter_mut()) + .zip(null_count.inner.iter_mut()) + .try_for_each(|(((min, max), distinct_count), null_count)| { + push( + stats, + min.as_mut(), + max.as_mut(), + distinct_count.as_mut(), + null_count.as_mut(), + ) + }); + }, + Map(_, _) => { + let min = min + .as_mut_any() + .downcast_mut::() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::() + .unwrap(); + let distinct_count = distinct_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + let null_count = null_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + return push( + stats, + min.inner.as_mut(), + max.inner.as_mut(), + distinct_count.inner.as_mut(), + null_count.inner.as_mut(), + ); + }, + _ => {}, + } + + let (from, type_) = stats.pop_front().unwrap(); + let from = from.as_deref(); + + let distinct_count = distinct_count + .as_mut_any() + .downcast_mut::() + .unwrap(); + let null_count = null_count.as_mut_any().downcast_mut::().unwrap(); + + push_others(from, distinct_count, null_count); + + let physical_type = &type_.physical_type; + + use DataType::*; + match min.data_type().to_logical_type() { + Boolean => boolean::push(from, min, max), + Int8 => primitive::push(from, min, max, |x: i32| Ok(x as i8)), + Int16 => primitive::push(from, min, max, |x: i32| Ok(x as i16)), + Date32 | Time32(_) => primitive::push::(from, min, max, Ok), + Interval(IntervalUnit::YearMonth) => fixlen::push_year_month(from, min, max), + Interval(IntervalUnit::DayTime) => fixlen::push_days_ms(from, min, max), + 
UInt8 => primitive::push(from, min, max, |x: i32| Ok(x as u8)), + UInt16 => primitive::push(from, min, max, |x: i32| Ok(x as u16)), + UInt32 => match physical_type { + // some implementations of parquet write arrow's u32 into i64. + ParquetPhysicalType::Int64 => primitive::push(from, min, max, |x: i64| Ok(x as u32)), + ParquetPhysicalType::Int32 => primitive::push(from, min, max, |x: i32| Ok(x as u32)), + other => Err(Error::NotYetImplemented(format!( + "Can't decode UInt32 type from parquet type {other:?}" + ))), + }, + Int32 => primitive::push::(from, min, max, Ok), + Date64 => match physical_type { + ParquetPhysicalType::Int64 => primitive::push::(from, min, max, Ok), + // some implementations of parquet write arrow's date64 into i32. + ParquetPhysicalType::Int32 => { + primitive::push(from, min, max, |x: i32| Ok(x as i64 * 86400000)) + }, + other => Err(Error::NotYetImplemented(format!( + "Can't decode Date64 type from parquet type {other:?}" + ))), + }, + Int64 | Time64(_) | Duration(_) => primitive::push::(from, min, max, Ok), + UInt64 => primitive::push(from, min, max, |x: i64| Ok(x as u64)), + Timestamp(time_unit, _) => { + let time_unit = *time_unit; + if physical_type == &ParquetPhysicalType::Int96 { + let from = from.map(|from| { + let from = from + .as_any() + .downcast_ref::>() + .unwrap(); + PrimitiveStatistics:: { + primitive_type: from.primitive_type.clone(), + null_count: from.null_count, + distinct_count: from.distinct_count, + min_value: from.min_value.map(int96_to_i64_ns), + max_value: from.max_value.map(int96_to_i64_ns), + } + }); + primitive::push( + from.as_ref().map(|x| x as &dyn ParquetStatistics), + min, + max, + |x: i64| { + Ok(primitive::timestamp( + type_.logical_type.as_ref(), + time_unit, + x, + )) + }, + ) + } else { + primitive::push(from, min, max, |x: i64| { + Ok(primitive::timestamp( + type_.logical_type.as_ref(), + time_unit, + x, + )) + }) + } + }, + Float32 => primitive::push::(from, min, max, Ok), + Float64 => primitive::push::(from, min, max, Ok), + Decimal(_, _) => match physical_type { + ParquetPhysicalType::Int32 => primitive::push(from, min, max, |x: i32| Ok(x as i128)), + ParquetPhysicalType::Int64 => primitive::push(from, min, max, |x: i64| Ok(x as i128)), + ParquetPhysicalType::FixedLenByteArray(n) if *n > 16 => Err(Error::NotYetImplemented( + format!("Can't decode Decimal128 type from Fixed Size Byte Array of len {n:?}"), + )), + ParquetPhysicalType::FixedLenByteArray(n) => fixlen::push_i128(from, *n, min, max), + _ => unreachable!(), + }, + Decimal256(_, _) => match physical_type { + ParquetPhysicalType::Int32 => { + primitive::push(from, min, max, |x: i32| Ok(i256(I256::new(x.into())))) + }, + ParquetPhysicalType::Int64 => { + primitive::push(from, min, max, |x: i64| Ok(i256(I256::new(x.into())))) + }, + ParquetPhysicalType::FixedLenByteArray(n) if *n <= 16 => { + fixlen::push_i256_with_i128(from, *n, min, max) + }, + ParquetPhysicalType::FixedLenByteArray(n) if *n > 32 => Err(Error::NotYetImplemented( + format!("Can't decode Decimal256 type from Fixed Size Byte Array of len {n:?}"), + )), + ParquetPhysicalType::FixedLenByteArray(_) => fixlen::push_i256(from, min, max), + _ => unreachable!(), + }, + Binary => binary::push::(from, min, max), + LargeBinary => binary::push::(from, min, max), + Utf8 => utf8::push::(from, min, max), + LargeUtf8 => utf8::push::(from, min, max), + FixedSizeBinary(_) => fixlen::push(from, min, max), + Null => null::push(min, max), + other => todo!("{:?}", other), + } +} + +/// Deserializes the statistics in the 
column chunks from all `row_groups`
+/// into [`Statistics`] associated with `field`'s name.
+///
+/// # Errors
+/// This function errors if the deserialization of the statistics fails (e.g. invalid utf8)
+pub fn deserialize(field: &Field, row_groups: &[RowGroupMetaData]) -> Result<Statistics> {
+    let mut statistics = MutableStatistics::try_new(field)?;
+
+    // transpose
+    row_groups.iter().try_for_each(|group| {
+        let columns = get_field_columns(group.columns(), field.name.as_ref());
+        let mut stats = columns
+            .into_iter()
+            .map(|column| {
+                Ok((
+                    column.statistics().transpose()?,
+                    column.descriptor().descriptor.primitive_type.clone(),
+                ))
+            })
+            .collect::<Result<VecDeque<(Option<Arc<dyn ParquetStatistics>>, ParquetPrimitiveType)>>>()?;
+        push(
+            &mut stats,
+            statistics.min_value.as_mut(),
+            statistics.max_value.as_mut(),
+            statistics.distinct_count.as_mut(),
+            statistics.null_count.as_mut(),
+        )
+    })?;
+
+    Ok(statistics.into())
+}
diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/null.rs b/crates/nano-arrow/src/io/parquet/read/statistics/null.rs
new file mode 100644
index 000000000000..9102720ebc5c
--- /dev/null
+++ b/crates/nano-arrow/src/io/parquet/read/statistics/null.rs
@@ -0,0 +1,11 @@
+use crate::array::*;
+use crate::error::Result;
+
+pub(super) fn push(min: &mut dyn MutableArray, max: &mut dyn MutableArray) -> Result<()> {
+    let min = min.as_mut_any().downcast_mut::<MutableNullArray>().unwrap();
+    let max = max.as_mut_any().downcast_mut::<MutableNullArray>().unwrap();
+    min.push_null();
+    max.push_null();
+
+    Ok(())
+}
diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/primitive.rs b/crates/nano-arrow/src/io/parquet/read/statistics/primitive.rs
new file mode 100644
index 000000000000..849363028ad1
--- /dev/null
+++ b/crates/nano-arrow/src/io/parquet/read/statistics/primitive.rs
@@ -0,0 +1,55 @@
+use parquet2::schema::types::{PrimitiveLogicalType, TimeUnit as ParquetTimeUnit};
+use parquet2::statistics::{PrimitiveStatistics, Statistics as ParquetStatistics};
+use parquet2::types::NativeType as ParquetNativeType;
+
+use crate::array::*;
+use crate::datatypes::TimeUnit;
+use crate::error::Result;
+use crate::types::NativeType;
+
+pub fn timestamp(logical_type: Option<&PrimitiveLogicalType>, time_unit: TimeUnit, x: i64) -> i64 {
+    let unit = if let Some(PrimitiveLogicalType::Timestamp { unit, ..
}) = logical_type { + unit + } else { + return x; + }; + + match (unit, time_unit) { + (ParquetTimeUnit::Milliseconds, TimeUnit::Second) => x / 1_000, + (ParquetTimeUnit::Microseconds, TimeUnit::Second) => x / 1_000_000, + (ParquetTimeUnit::Nanoseconds, TimeUnit::Second) => x / 1_000_000_000, + + (ParquetTimeUnit::Milliseconds, TimeUnit::Millisecond) => x, + (ParquetTimeUnit::Microseconds, TimeUnit::Millisecond) => x / 1_000, + (ParquetTimeUnit::Nanoseconds, TimeUnit::Millisecond) => x / 1_000_000, + + (ParquetTimeUnit::Milliseconds, TimeUnit::Microsecond) => x * 1_000, + (ParquetTimeUnit::Microseconds, TimeUnit::Microsecond) => x, + (ParquetTimeUnit::Nanoseconds, TimeUnit::Microsecond) => x / 1_000, + + (ParquetTimeUnit::Milliseconds, TimeUnit::Nanosecond) => x * 1_000_000, + (ParquetTimeUnit::Microseconds, TimeUnit::Nanosecond) => x * 1_000, + (ParquetTimeUnit::Nanoseconds, TimeUnit::Nanosecond) => x, + } +} + +pub(super) fn push<P: ParquetNativeType, T: NativeType, F: Fn(P) -> Result<T> + Copy>( + from: Option<&dyn ParquetStatistics>, + min: &mut dyn MutableArray, + max: &mut dyn MutableArray, + map: F, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::<MutablePrimitiveArray<T>>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::<MutablePrimitiveArray<T>>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::<PrimitiveStatistics<P>>().unwrap()); + min.push(from.and_then(|s| s.min_value.map(map)).transpose()?); + max.push(from.and_then(|s| s.max_value.map(map)).transpose()?); + + Ok(()) +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/struct_.rs b/crates/nano-arrow/src/io/parquet/read/statistics/struct_.rs new file mode 100644 index 000000000000..6aca0352701e --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/struct_.rs @@ -0,0 +1,64 @@ +use super::make_mutable; +use crate::array::{Array, MutableArray, StructArray}; +use crate::datatypes::DataType; +use crate::error::Result; + +#[derive(Debug)] +pub struct DynMutableStructArray { + data_type: DataType, + pub inner: Vec<Box<dyn MutableArray>>, +} + +impl DynMutableStructArray { + pub fn try_with_capacity(data_type: DataType, capacity: usize) -> Result<Self> { + let inners = match data_type.to_logical_type() { + DataType::Struct(inner) => inner, + _ => unreachable!(), + }; + let inner = inners + .iter() + .map(|f| make_mutable(f.data_type(), capacity)) + .collect::<Result<Vec<_>>>()?; + + Ok(Self { data_type, inner }) + } +} +impl MutableArray for DynMutableStructArray { + fn data_type(&self) -> &DataType { + &self.data_type + } + + fn len(&self) -> usize { + self.inner[0].len() + } + + fn validity(&self) -> Option<&crate::bitmap::MutableBitmap> { + None + } + + fn as_box(&mut self) -> Box<dyn Array> { + let inner = self.inner.iter_mut().map(|x| x.as_box()).collect(); + + Box::new(StructArray::new(self.data_type.clone(), inner, None)) + } + + fn as_any(&self) -> &dyn std::any::Any { + self + } + + fn as_mut_any(&mut self) -> &mut dyn std::any::Any { + self + } + + fn push_null(&mut self) { + todo!() + } + + fn reserve(&mut self, _: usize) { + todo!(); + } + + fn shrink_to_fit(&mut self) { + todo!() + } +} diff --git a/crates/nano-arrow/src/io/parquet/read/statistics/utf8.rs b/crates/nano-arrow/src/io/parquet/read/statistics/utf8.rs new file mode 100644 index 000000000000..da9fcb6e1119 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/read/statistics/utf8.rs @@ -0,0 +1,31 @@ +use parquet2::statistics::{BinaryStatistics, Statistics as ParquetStatistics}; + +use crate::array::{MutableArray, MutableUtf8Array}; +use crate::error::Result; +use crate::offset::Offset; + +pub(super) fn push<O: Offset>( + from: Option<&dyn ParquetStatistics>, + min: &mut 
dyn MutableArray, + max: &mut dyn MutableArray, +) -> Result<()> { + let min = min + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let max = max + .as_mut_any() + .downcast_mut::>() + .unwrap(); + let from = from.map(|s| s.as_any().downcast_ref::().unwrap()); + + min.push( + from.and_then(|s| s.min_value.as_deref().map(simdutf8::basic::from_utf8)) + .transpose()?, + ); + max.push( + from.and_then(|s| s.max_value.as_deref().map(simdutf8::basic::from_utf8)) + .transpose()?, + ); + Ok(()) +} diff --git a/crates/nano-arrow/src/io/parquet/write/binary/basic.rs b/crates/nano-arrow/src/io/parquet/write/binary/basic.rs new file mode 100644 index 000000000000..de840e45fa5a --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/binary/basic.rs @@ -0,0 +1,168 @@ +use parquet2::encoding::{delta_bitpacked, Encoding}; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{serialize_statistics, BinaryStatistics, ParquetStatistics, Statistics}; + +use super::super::{utils, WriteOptions}; +use crate::array::{Array, BinaryArray}; +use crate::bitmap::Bitmap; +use crate::error::{Error, Result}; +use crate::io::parquet::read::schema::is_nullable; +use crate::offset::Offset; + +pub(crate) fn encode_plain( + array: &BinaryArray, + is_optional: bool, + buffer: &mut Vec, +) { + // append the non-null values + if is_optional { + array.iter().for_each(|x| { + if let Some(x) = x { + // BYTE_ARRAY: first 4 bytes denote length in littleendian. + let len = (x.len() as u32).to_le_bytes(); + buffer.extend_from_slice(&len); + buffer.extend_from_slice(x); + } + }) + } else { + array.values_iter().for_each(|x| { + // BYTE_ARRAY: first 4 bytes denote length in littleendian. + let len = (x.len() as u32).to_le_bytes(); + buffer.extend_from_slice(&len); + buffer.extend_from_slice(x); + }) + } +} + +pub fn array_to_page( + array: &BinaryArray, + options: WriteOptions, + type_: PrimitiveType, + encoding: Encoding, +) -> Result { + let validity = array.validity(); + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + utils::write_def_levels( + &mut buffer, + is_optional, + validity, + array.len(), + options.version, + )?; + + let definition_levels_byte_length = buffer.len(); + + match encoding { + Encoding::Plain => encode_plain(array, is_optional, &mut buffer), + Encoding::DeltaLengthByteArray => encode_delta( + array.values(), + array.offsets().buffer(), + array.validity(), + is_optional, + &mut buffer, + ), + _ => { + return Err(Error::InvalidArgumentError(format!( + "Datatype {:?} cannot be encoded by {:?} encoding", + array.data_type(), + encoding + ))) + }, + } + + let statistics = if options.write_statistics { + Some(build_statistics(array, type_.clone())) + } else { + None + }; + + utils::build_plain_page( + buffer, + array.len(), + array.len(), + array.null_count(), + 0, + definition_levels_byte_length, + statistics, + type_, + options, + encoding, + ) +} + +pub(crate) fn build_statistics( + array: &BinaryArray, + primitive_type: PrimitiveType, +) -> ParquetStatistics { + let statistics = &BinaryStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .max_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + min_value: array + .iter() + .flatten() + .min_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + } as &dyn Statistics; + serialize_statistics(statistics) +} + +pub(crate) fn encode_delta( + values: &[u8], + offsets: &[O], + validity: 
Option<&Bitmap>, + is_optional: bool, + buffer: &mut Vec, +) { + if is_optional { + if let Some(validity) = validity { + let lengths = offsets + .windows(2) + .map(|w| (w[1] - w[0]).to_usize() as i64) + .zip(validity.iter()) + .flat_map(|(x, is_valid)| if is_valid { Some(x) } else { None }); + let length = offsets.len() - 1 - validity.unset_bits(); + let lengths = utils::ExactSizedIter::new(lengths, length); + + delta_bitpacked::encode(lengths, buffer); + } else { + let lengths = offsets.windows(2).map(|w| (w[1] - w[0]).to_usize() as i64); + delta_bitpacked::encode(lengths, buffer); + } + } else { + let lengths = offsets.windows(2).map(|w| (w[1] - w[0]).to_usize() as i64); + delta_bitpacked::encode(lengths, buffer); + } + + buffer.extend_from_slice( + &values[offsets.first().unwrap().to_usize()..offsets.last().unwrap().to_usize()], + ) +} + +/// Returns the ordering of two binary values. This corresponds to pyarrows' ordering +/// of statistics. +pub(crate) fn ord_binary<'a>(a: &'a [u8], b: &'a [u8]) -> std::cmp::Ordering { + use std::cmp::Ordering::*; + match (a.is_empty(), b.is_empty()) { + (true, true) => return Equal, + (true, false) => return Less, + (false, true) => return Greater, + (false, false) => {}, + } + + for (v1, v2) in a.iter().zip(b.iter()) { + match v1.cmp(v2) { + Equal => continue, + other => return other, + } + } + Equal +} diff --git a/crates/nano-arrow/src/io/parquet/write/binary/mod.rs b/crates/nano-arrow/src/io/parquet/write/binary/mod.rs new file mode 100644 index 000000000000..e942b4b69103 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/binary/mod.rs @@ -0,0 +1,7 @@ +mod basic; +mod nested; + +pub use basic::array_to_page; +pub(crate) use basic::{build_statistics, encode_plain}; +pub(super) use basic::{encode_delta, ord_binary}; +pub use nested::array_to_page as nested_array_to_page; diff --git a/crates/nano-arrow/src/io/parquet/write/binary/nested.rs b/crates/nano-arrow/src/io/parquet/write/binary/nested.rs new file mode 100644 index 000000000000..11de9d9676a7 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/binary/nested.rs @@ -0,0 +1,48 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; + +use super::super::{nested, utils, WriteOptions}; +use super::basic::{build_statistics, encode_plain}; +use crate::array::{Array, BinaryArray}; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::Nested; +use crate::offset::Offset; + +pub fn array_to_page( + array: &BinaryArray, + options: WriteOptions, + type_: PrimitiveType, + nested: &[Nested], +) -> Result +where + O: Offset, +{ + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + let (repetition_levels_byte_length, definition_levels_byte_length) = + nested::write_rep_and_def(options.version, nested, &mut buffer)?; + + encode_plain(array, is_optional, &mut buffer); + + let statistics = if options.write_statistics { + Some(build_statistics(array, type_.clone())) + } else { + None + }; + + utils::build_plain_page( + buffer, + nested::num_values(nested), + nested[0].len(), + array.null_count(), + repetition_levels_byte_length, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::Plain, + ) +} diff --git a/crates/nano-arrow/src/io/parquet/write/boolean/basic.rs b/crates/nano-arrow/src/io/parquet/write/boolean/basic.rs new file mode 100644 index 000000000000..833bfab09e5a --- /dev/null +++ 
b/crates/nano-arrow/src/io/parquet/write/boolean/basic.rs @@ -0,0 +1,92 @@ +use parquet2::encoding::hybrid_rle::bitpacked_encode; +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{ + serialize_statistics, BooleanStatistics, ParquetStatistics, Statistics, +}; + +use super::super::{utils, WriteOptions}; +use crate::array::*; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; + +fn encode(iterator: impl Iterator, buffer: &mut Vec) -> Result<()> { + // encode values using bitpacking + let len = buffer.len(); + let mut buffer = std::io::Cursor::new(buffer); + buffer.set_position(len as u64); + Ok(bitpacked_encode(&mut buffer, iterator)?) +} + +pub(super) fn encode_plain( + array: &BooleanArray, + is_optional: bool, + buffer: &mut Vec, +) -> Result<()> { + if is_optional { + let iter = array.iter().flatten().take( + array + .validity() + .as_ref() + .map(|x| x.len() - x.unset_bits()) + .unwrap_or_else(|| array.len()), + ); + encode(iter, buffer) + } else { + let iter = array.values().iter(); + encode(iter, buffer) + } +} + +pub fn array_to_page( + array: &BooleanArray, + options: WriteOptions, + type_: PrimitiveType, +) -> Result { + let is_optional = is_nullable(&type_.field_info); + + let validity = array.validity(); + + let mut buffer = vec![]; + utils::write_def_levels( + &mut buffer, + is_optional, + validity, + array.len(), + options.version, + )?; + + let definition_levels_byte_length = buffer.len(); + + encode_plain(array, is_optional, &mut buffer)?; + + let statistics = if options.write_statistics { + Some(build_statistics(array)) + } else { + None + }; + + utils::build_plain_page( + buffer, + array.len(), + array.len(), + array.null_count(), + 0, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::Plain, + ) +} + +pub(super) fn build_statistics(array: &BooleanArray) -> ParquetStatistics { + let statistics = &BooleanStatistics { + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array.iter().flatten().max(), + min_value: array.iter().flatten().min(), + } as &dyn Statistics; + serialize_statistics(statistics) +} diff --git a/crates/nano-arrow/src/io/parquet/write/boolean/mod.rs b/crates/nano-arrow/src/io/parquet/write/boolean/mod.rs new file mode 100644 index 000000000000..280e2ff9efb5 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/boolean/mod.rs @@ -0,0 +1,5 @@ +mod basic; +mod nested; + +pub use basic::array_to_page; +pub use nested::array_to_page as nested_array_to_page; diff --git a/crates/nano-arrow/src/io/parquet/write/boolean/nested.rs b/crates/nano-arrow/src/io/parquet/write/boolean/nested.rs new file mode 100644 index 000000000000..656019100825 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/boolean/nested.rs @@ -0,0 +1,44 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; + +use super::super::{nested, utils, WriteOptions}; +use super::basic::{build_statistics, encode_plain}; +use crate::array::{Array, BooleanArray}; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::Nested; + +pub fn array_to_page( + array: &BooleanArray, + options: WriteOptions, + type_: PrimitiveType, + nested: &[Nested], +) -> Result { + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + let (repetition_levels_byte_length, definition_levels_byte_length) = + 
nested::write_rep_and_def(options.version, nested, &mut buffer)?; + + encode_plain(array, is_optional, &mut buffer)?; + + let statistics = if options.write_statistics { + Some(build_statistics(array)) + } else { + None + }; + + utils::build_plain_page( + buffer, + nested::num_values(nested), + nested[0].len(), + array.null_count(), + repetition_levels_byte_length, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::Plain, + ) +} diff --git a/crates/nano-arrow/src/io/parquet/write/dictionary.rs b/crates/nano-arrow/src/io/parquet/write/dictionary.rs new file mode 100644 index 000000000000..4ee0a5c37eac --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/dictionary.rs @@ -0,0 +1,281 @@ +use parquet2::encoding::hybrid_rle::encode_u32; +use parquet2::encoding::Encoding; +use parquet2::page::{DictPage, Page}; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{serialize_statistics, ParquetStatistics}; +use parquet2::write::DynIter; + +use super::binary::{ + build_statistics as binary_build_statistics, encode_plain as binary_encode_plain, +}; +use super::fixed_len_bytes::{ + build_statistics as fixed_binary_build_statistics, encode_plain as fixed_binary_encode_plain, +}; +use super::primitive::{ + build_statistics as primitive_build_statistics, encode_plain as primitive_encode_plain, +}; +use super::utf8::{build_statistics as utf8_build_statistics, encode_plain as utf8_encode_plain}; +use super::{nested, Nested, WriteOptions}; +use crate::array::{Array, DictionaryArray, DictionaryKey}; +use crate::bitmap::{Bitmap, MutableBitmap}; +use crate::datatypes::DataType; +use crate::error::{Error, Result}; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::{slice_nested_leaf, utils}; + +fn serialize_def_levels_simple( + validity: Option<&Bitmap>, + length: usize, + is_optional: bool, + options: WriteOptions, + buffer: &mut Vec, +) -> Result<()> { + utils::write_def_levels(buffer, is_optional, validity, length, options.version) +} + +fn serialize_keys_values( + array: &DictionaryArray, + validity: Option<&Bitmap>, + buffer: &mut Vec, +) -> Result<()> { + let keys = array.keys_values_iter().map(|x| x as u32); + if let Some(validity) = validity { + // discard indices whose values are null. + let keys = keys + .zip(validity.iter()) + .filter(|&(_key, is_valid)| is_valid) + .map(|(key, _is_valid)| key); + let num_bits = utils::get_bit_width(keys.clone().max().unwrap_or(0) as u64); + + let keys = utils::ExactSizedIter::new(keys, array.len() - validity.unset_bits()); + + // num_bits as a single byte + buffer.push(num_bits as u8); + + // followed by the encoded indices. + Ok(encode_u32(buffer, keys, num_bits)?) + } else { + let num_bits = utils::get_bit_width(keys.clone().max().unwrap_or(0) as u64); + + // num_bits as a single byte + buffer.push(num_bits as u8); + + // followed by the encoded indices. + Ok(encode_u32(buffer, keys, num_bits)?) 
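+ // Layout of the buffer written above, on a hypothetical example (keys not from the original
+ // source): for keys [0, 2, 1] the maximum key is 2, so num_bits = 2; the buffer then holds the
+ // single byte 2 followed by the hybrid RLE/bit-packed run of those 2-bit indices. Readers
+ // recover the bit width from that leading byte before decoding the dictionary positions.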
+ } +} + +fn serialize_levels( + validity: Option<&Bitmap>, + length: usize, + type_: &PrimitiveType, + nested: &[Nested], + options: WriteOptions, + buffer: &mut Vec, +) -> Result<(usize, usize)> { + if nested.len() == 1 { + let is_optional = is_nullable(&type_.field_info); + serialize_def_levels_simple(validity, length, is_optional, options, buffer)?; + let definition_levels_byte_length = buffer.len(); + Ok((0, definition_levels_byte_length)) + } else { + nested::write_rep_and_def(options.version, nested, buffer) + } +} + +fn normalized_validity(array: &DictionaryArray) -> Option { + match (array.keys().validity(), array.values().validity()) { + (None, None) => None, + (None, rhs) => rhs.cloned(), + (lhs, None) => lhs.cloned(), + (Some(_), Some(rhs)) => { + let projected_validity = array + .keys_iter() + .map(|x| x.map(|x| rhs.get_bit(x)).unwrap_or(false)); + MutableBitmap::from_trusted_len_iter(projected_validity).into() + }, + } +} + +fn serialize_keys( + array: &DictionaryArray, + type_: PrimitiveType, + nested: &[Nested], + statistics: Option, + options: WriteOptions, +) -> Result { + let mut buffer = vec![]; + + // parquet only accepts a single validity - we "&" the validities into a single one + // and ignore keys whole _value_ is null. + let validity = normalized_validity(array); + let (start, len) = slice_nested_leaf(nested); + + let mut nested = nested.to_vec(); + let array = array.clone().sliced(start, len); + if let Some(Nested::Primitive(_, _, c)) = nested.last_mut() { + *c = len; + } else { + unreachable!("") + } + + let (repetition_levels_byte_length, definition_levels_byte_length) = serialize_levels( + validity.as_ref(), + array.len(), + &type_, + &nested, + options, + &mut buffer, + )?; + + serialize_keys_values(&array, validity.as_ref(), &mut buffer)?; + + let (num_values, num_rows) = if nested.len() == 1 { + (array.len(), array.len()) + } else { + (nested::num_values(&nested), nested[0].len()) + }; + + utils::build_plain_page( + buffer, + num_values, + num_rows, + array.null_count(), + repetition_levels_byte_length, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::RleDictionary, + ) + .map(Page::Data) +} + +macro_rules! 
dyn_prim { + ($from:ty, $to:ty, $array:expr, $options:expr, $type_:expr) => {{ + let values = $array.values().as_any().downcast_ref().unwrap(); + + let buffer = primitive_encode_plain::<$from, $to>(values, false, vec![]); + + let stats: Option = if $options.write_statistics { + let mut stats = primitive_build_statistics::<$from, $to>(values, $type_.clone()); + stats.null_count = Some($array.null_count() as i64); + let stats = serialize_statistics(&stats); + Some(stats) + } else { + None + }; + (DictPage::new(buffer, values.len(), false), stats) + }}; +} + +pub fn array_to_pages( + array: &DictionaryArray, + type_: PrimitiveType, + nested: &[Nested], + options: WriteOptions, + encoding: Encoding, +) -> Result>> { + match encoding { + Encoding::PlainDictionary | Encoding::RleDictionary => { + // write DictPage + let (dict_page, statistics): (_, Option) = + match array.values().data_type().to_logical_type() { + DataType::Int8 => dyn_prim!(i8, i32, array, options, type_), + DataType::Int16 => dyn_prim!(i16, i32, array, options, type_), + DataType::Int32 | DataType::Date32 | DataType::Time32(_) => { + dyn_prim!(i32, i32, array, options, type_) + }, + DataType::Int64 + | DataType::Date64 + | DataType::Time64(_) + | DataType::Timestamp(_, _) + | DataType::Duration(_) => dyn_prim!(i64, i64, array, options, type_), + DataType::UInt8 => dyn_prim!(u8, i32, array, options, type_), + DataType::UInt16 => dyn_prim!(u16, i32, array, options, type_), + DataType::UInt32 => dyn_prim!(u32, i32, array, options, type_), + DataType::UInt64 => dyn_prim!(u64, i64, array, options, type_), + DataType::Float32 => dyn_prim!(f32, f32, array, options, type_), + DataType::Float64 => dyn_prim!(f64, f64, array, options, type_), + DataType::Utf8 => { + let array = array.values().as_any().downcast_ref().unwrap(); + + let mut buffer = vec![]; + utf8_encode_plain::(array, false, &mut buffer); + let stats = if options.write_statistics { + Some(utf8_build_statistics(array, type_.clone())) + } else { + None + }; + (DictPage::new(buffer, array.len(), false), stats) + }, + DataType::LargeUtf8 => { + let array = array.values().as_any().downcast_ref().unwrap(); + + let mut buffer = vec![]; + utf8_encode_plain::(array, false, &mut buffer); + let stats = if options.write_statistics { + Some(utf8_build_statistics(array, type_.clone())) + } else { + None + }; + (DictPage::new(buffer, array.len(), false), stats) + }, + DataType::Binary => { + let array = array.values().as_any().downcast_ref().unwrap(); + + let mut buffer = vec![]; + binary_encode_plain::(array, false, &mut buffer); + let stats = if options.write_statistics { + Some(binary_build_statistics(array, type_.clone())) + } else { + None + }; + (DictPage::new(buffer, array.len(), false), stats) + }, + DataType::LargeBinary => { + let values = array.values().as_any().downcast_ref().unwrap(); + + let mut buffer = vec![]; + binary_encode_plain::(values, false, &mut buffer); + let stats = if options.write_statistics { + let mut stats = binary_build_statistics(values, type_.clone()); + stats.null_count = Some(array.null_count() as i64); + Some(stats) + } else { + None + }; + (DictPage::new(buffer, values.len(), false), stats) + }, + DataType::FixedSizeBinary(_) => { + let mut buffer = vec![]; + let array = array.values().as_any().downcast_ref().unwrap(); + fixed_binary_encode_plain(array, false, &mut buffer); + let stats = if options.write_statistics { + let mut stats = fixed_binary_build_statistics(array, type_.clone()); + stats.null_count = Some(array.null_count() as i64); + 
Some(serialize_statistics(&stats)) + } else { + None + }; + (DictPage::new(buffer, array.len(), false), stats) + }, + other => { + return Err(Error::NotYetImplemented(format!( + "Writing dictionary arrays to parquet only support data type {other:?}" + ))) + }, + }; + let dict_page = Page::Dict(dict_page); + + // write DataPage pointing to DictPage + let data_page = serialize_keys(array, type_, nested, statistics, options)?; + + let iter = std::iter::once(Ok(dict_page)).chain(std::iter::once(Ok(data_page))); + Ok(DynIter::new(Box::new(iter))) + }, + _ => Err(Error::NotYetImplemented( + "Dictionary arrays only support dictionary encoding".to_string(), + )), + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/file.rs b/crates/nano-arrow/src/io/parquet/write/file.rs new file mode 100644 index 000000000000..4ec37b941ad9 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/file.rs @@ -0,0 +1,95 @@ +use std::io::Write; + +use parquet2::metadata::{KeyValue, SchemaDescriptor}; +use parquet2::write::{RowGroupIter, WriteOptions as FileWriteOptions}; + +use super::schema::schema_to_metadata_key; +use super::{to_parquet_schema, ThriftFileMetaData, WriteOptions}; +use crate::datatypes::Schema; +use crate::error::{Error, Result}; + +/// Attaches [`Schema`] to `key_value_metadata` +pub fn add_arrow_schema( + schema: &Schema, + key_value_metadata: Option>, +) -> Option> { + key_value_metadata + .map(|mut x| { + x.push(schema_to_metadata_key(schema)); + x + }) + .or_else(|| Some(vec![schema_to_metadata_key(schema)])) +} + +/// An interface to write a parquet to a [`Write`] +pub struct FileWriter { + writer: parquet2::write::FileWriter, + schema: Schema, + options: WriteOptions, +} + +// Accessors +impl FileWriter { + /// The options assigned to the file + pub fn options(&self) -> WriteOptions { + self.options + } + + /// The [`SchemaDescriptor`] assigned to this file + pub fn parquet_schema(&self) -> &SchemaDescriptor { + self.writer.schema() + } + + /// The [`Schema`] assigned to this file + pub fn schema(&self) -> &Schema { + &self.schema + } +} + +impl FileWriter { + /// Returns a new [`FileWriter`]. + /// # Error + /// If it is unable to derive a parquet schema from [`Schema`]. + pub fn try_new(writer: W, schema: Schema, options: WriteOptions) -> Result { + let parquet_schema = to_parquet_schema(&schema)?; + + let created_by = Some("Arrow2 - Native Rust implementation of Arrow".to_string()); + + Ok(Self { + writer: parquet2::write::FileWriter::new( + writer, + parquet_schema, + FileWriteOptions { + version: options.version, + write_statistics: options.write_statistics, + }, + created_by, + ), + schema, + options, + }) + } + + /// Writes a row group to the file. + pub fn write(&mut self, row_group: RowGroupIter<'_, Error>) -> Result<()> { + Ok(self.writer.write(row_group)?) + } + + /// Writes the footer of the parquet file. Returns the total size of the file. + pub fn end(&mut self, key_value_metadata: Option>) -> Result { + let key_value_metadata = add_arrow_schema(&self.schema, key_value_metadata); + Ok(self.writer.end(key_value_metadata)?) 
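+ // Illustrative usage sketch (hypothetical bindings, not part of this diff): a writer created
+ // with `FileWriter::try_new(file, schema, options)?` is fed one row group per `write` call;
+ // `end(None)` then embeds the Arrow schema as a base64-encoded IPC payload via
+ // `add_arrow_schema`, writes the parquet footer and returns the total file size.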
+ } + + /// Consumes this writer and returns the inner writer + pub fn into_inner(self) -> W { + self.writer.into_inner() + } + + /// Returns the underlying writer and [`ThriftFileMetaData`] + /// # Panics + /// This function panics if [`Self::end`] has not yet been called + pub fn into_inner_and_metadata(self) -> (W, ThriftFileMetaData) { + self.writer.into_inner_and_metadata() + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/fixed_len_bytes.rs b/crates/nano-arrow/src/io/parquet/write/fixed_len_bytes.rs new file mode 100644 index 000000000000..86080ef7728f --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/fixed_len_bytes.rs @@ -0,0 +1,147 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{serialize_statistics, FixedLenStatistics}; + +use super::binary::ord_binary; +use super::{utils, WriteOptions}; +use crate::array::{Array, FixedSizeBinaryArray, PrimitiveArray}; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; +use crate::types::i256; + +pub(crate) fn encode_plain(array: &FixedSizeBinaryArray, is_optional: bool, buffer: &mut Vec) { + // append the non-null values + if is_optional { + array.iter().for_each(|x| { + if let Some(x) = x { + buffer.extend_from_slice(x); + } + }) + } else { + buffer.extend_from_slice(array.values()); + } +} + +pub fn array_to_page( + array: &FixedSizeBinaryArray, + options: WriteOptions, + type_: PrimitiveType, + statistics: Option, +) -> Result { + let is_optional = is_nullable(&type_.field_info); + let validity = array.validity(); + + let mut buffer = vec![]; + utils::write_def_levels( + &mut buffer, + is_optional, + validity, + array.len(), + options.version, + )?; + + let definition_levels_byte_length = buffer.len(); + + encode_plain(array, is_optional, &mut buffer); + + utils::build_plain_page( + buffer, + array.len(), + array.len(), + array.null_count(), + 0, + definition_levels_byte_length, + statistics.map(|x| serialize_statistics(&x)), + type_, + options, + Encoding::Plain, + ) +} + +pub(super) fn build_statistics( + array: &FixedSizeBinaryArray, + primitive_type: PrimitiveType, +) -> FixedLenStatistics { + FixedLenStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .max_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + min_value: array + .iter() + .flatten() + .min_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + } +} + +pub(super) fn build_statistics_decimal( + array: &PrimitiveArray, + primitive_type: PrimitiveType, + size: usize, +) -> FixedLenStatistics { + FixedLenStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .max() + .map(|x| x.to_be_bytes()[16 - size..].to_vec()), + min_value: array + .iter() + .flatten() + .min() + .map(|x| x.to_be_bytes()[16 - size..].to_vec()), + } +} + +pub(super) fn build_statistics_decimal256_with_i128( + array: &PrimitiveArray, + primitive_type: PrimitiveType, + size: usize, +) -> FixedLenStatistics { + FixedLenStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .max() + .map(|x| x.0.low().to_be_bytes()[16 - size..].to_vec()), + min_value: array + .iter() + .flatten() + .min() + .map(|x| x.0.low().to_be_bytes()[16 - size..].to_vec()), + } +} + +pub(super) fn build_statistics_decimal256( + 
array: &PrimitiveArray, + primitive_type: PrimitiveType, + size: usize, +) -> FixedLenStatistics { + FixedLenStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .max() + .map(|x| x.0.to_be_bytes()[32 - size..].to_vec()), + min_value: array + .iter() + .flatten() + .min() + .map(|x| x.0.to_be_bytes()[32 - size..].to_vec()), + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/mod.rs b/crates/nano-arrow/src/io/parquet/write/mod.rs new file mode 100644 index 000000000000..b74daea04d7e --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/mod.rs @@ -0,0 +1,876 @@ +//! APIs to write to Parquet format. +//! +//! # Arrow/Parquet Interoperability +//! As of [parquet-format v2.9](https://github.com/apache/parquet-format/blob/master/LogicalTypes.md) +//! there are Arrow [DataTypes](crate::datatypes::DataType) which do not have a parquet +//! representation. These include but are not limited to: +//! * `DataType::Timestamp(TimeUnit::Second, _)` +//! * `DataType::Int64` +//! * `DataType::Duration` +//! * `DataType::Date64` +//! * `DataType::Time32(TimeUnit::Second)` +//! +//! The use of these arrow types will result in no logical type being stored within a parquet file. + +mod binary; +mod boolean; +mod dictionary; +mod file; +mod fixed_len_bytes; +mod nested; +mod pages; +mod primitive; +mod row_group; +mod schema; +mod sink; +mod utf8; +mod utils; + +pub use nested::{num_values, write_rep_and_def}; +pub use pages::{to_leaves, to_nested, to_parquet_leaves}; +pub use parquet2::compression::{BrotliLevel, CompressionOptions, GzipLevel, ZstdLevel}; +pub use parquet2::encoding::Encoding; +pub use parquet2::metadata::{ + Descriptor, FileMetaData, KeyValue, SchemaDescriptor, ThriftFileMetaData, +}; +pub use parquet2::page::{CompressedDataPage, CompressedPage, Page}; +use parquet2::schema::types::PrimitiveType as ParquetPrimitiveType; +pub use parquet2::schema::types::{FieldInfo, ParquetType, PhysicalType as ParquetPhysicalType}; +pub use parquet2::write::{ + compress, write_metadata_sidecar, Compressor, DynIter, DynStreamingIterator, RowGroupIter, + Version, +}; +pub use parquet2::{fallible_streaming_iterator, FallibleStreamingIterator}; +pub use utils::write_def_levels; + +use crate::array::*; +use crate::datatypes::*; +use crate::error::{Error, Result}; +use crate::types::{days_ms, i256, NativeType}; + +/// Currently supported options to write to parquet +#[derive(Debug, Clone, Copy, PartialEq, Eq)] +pub struct WriteOptions { + /// Whether to write statistics + pub write_statistics: bool, + /// The page and file version to use + pub version: Version, + /// The compression to apply to every page + pub compression: CompressionOptions, + /// The size to flush a page, defaults to 1024 * 1024 if None + pub data_pagesize_limit: Option, +} + +pub use file::FileWriter; +pub use pages::{array_to_columns, Nested}; +pub use row_group::{row_group_iter, RowGroupIterator}; +pub use schema::to_parquet_type; +pub use sink::FileSink; + +use crate::compute::aggregate::estimated_bytes_size; + +/// returns offset and length to slice the leaf values +pub fn slice_nested_leaf(nested: &[Nested]) -> (usize, usize) { + // find the deepest recursive dremel structure as that one determines how many values we must + // take + let mut out = (0, 0); + for nested in nested.iter().rev() { + match nested { + Nested::LargeList(l_nested) => { + let start = *l_nested.offsets.first(); + let end = *l_nested.offsets.last(); + return (start 
as usize, (end - start) as usize); + }, + Nested::List(l_nested) => { + let start = *l_nested.offsets.first(); + let end = *l_nested.offsets.last(); + return (start as usize, (end - start) as usize); + }, + Nested::Primitive(_, _, len) => out = (0, *len), + _ => {}, + } + } + out +} + +fn decimal_length_from_precision(precision: usize) -> usize { + // digits = floor(log_10(2^(8*n - 1) - 1)) + // ceil(digits) = log10(2^(8*n - 1) - 1) + // 10^ceil(digits) = 2^(8*n - 1) - 1 + // 10^ceil(digits) + 1 = 2^(8*n - 1) + // log2(10^ceil(digits) + 1) = (8*n - 1) + // log2(10^ceil(digits) + 1) + 1 = 8*n + // (log2(10^ceil(a) + 1) + 1) / 8 = n + (((10.0_f64.powi(precision as i32) + 1.0).log2() + 1.0) / 8.0).ceil() as usize +} + +/// Creates a parquet [`SchemaDescriptor`] from a [`Schema`]. +pub fn to_parquet_schema(schema: &Schema) -> Result { + let parquet_types = schema + .fields + .iter() + .map(to_parquet_type) + .collect::>>()?; + Ok(SchemaDescriptor::new("root".to_string(), parquet_types)) +} + +/// Checks whether the `data_type` can be encoded as `encoding`. +/// Note that this is whether this implementation supports it, which is a subset of +/// what the parquet spec allows. +pub fn can_encode(data_type: &DataType, encoding: Encoding) -> bool { + if let (Encoding::DeltaBinaryPacked, DataType::Decimal(p, _)) = + (encoding, data_type.to_logical_type()) + { + return *p <= 18; + }; + + matches!( + (encoding, data_type.to_logical_type()), + (Encoding::Plain, _) + | ( + Encoding::DeltaLengthByteArray, + DataType::Binary | DataType::LargeBinary | DataType::Utf8 | DataType::LargeUtf8, + ) + | (Encoding::RleDictionary, DataType::Dictionary(_, _, _)) + | (Encoding::PlainDictionary, DataType::Dictionary(_, _, _)) + | ( + Encoding::DeltaBinaryPacked, + DataType::Null + | DataType::UInt8 + | DataType::UInt16 + | DataType::UInt32 + | DataType::UInt64 + | DataType::Int8 + | DataType::Int16 + | DataType::Int32 + | DataType::Date32 + | DataType::Time32(_) + | DataType::Int64 + | DataType::Date64 + | DataType::Time64(_) + | DataType::Timestamp(_, _) + | DataType::Duration(_) + ) + ) +} + +/// Slices the [`Array`] to `Box` and `Vec`. +pub fn slice_parquet_array( + primitive_array: &mut dyn Array, + nested: &mut [Nested], + mut current_offset: usize, + mut current_length: usize, +) { + for nested in nested.iter_mut() { + match nested { + Nested::LargeList(l_nested) => { + l_nested.offsets.slice(current_offset, current_length + 1); + if let Some(validity) = l_nested.validity.as_mut() { + validity.slice(current_offset, current_length) + }; + + current_length = l_nested.offsets.range() as usize; + current_offset = *l_nested.offsets.first() as usize; + }, + Nested::List(l_nested) => { + l_nested.offsets.slice(current_offset, current_length + 1); + if let Some(validity) = l_nested.validity.as_mut() { + validity.slice(current_offset, current_length) + }; + + current_length = l_nested.offsets.range() as usize; + current_offset = *l_nested.offsets.first() as usize; + }, + Nested::Struct(validity, _, length) => { + *length = current_length; + if let Some(validity) = validity.as_mut() { + validity.slice(current_offset, current_length) + }; + }, + Nested::Primitive(validity, _, length) => { + *length = current_length; + if let Some(validity) = validity.as_mut() { + validity.slice(current_offset, current_length) + }; + primitive_array.slice(current_offset, current_length); + }, + } + } +} + +/// Get the length of [`Array`] that should be sliced. 
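+/// For example, a single list level whose offsets are `[0, 2, 5]` has an offset range of 5,
+/// so 5 leaf values must be sliced.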
+pub fn get_max_length(nested: &[Nested]) -> usize { + let mut length = 0; + for nested in nested.iter() { + match nested { + Nested::LargeList(l_nested) => length += l_nested.offsets.range() as usize, + Nested::List(l_nested) => length += l_nested.offsets.range() as usize, + _ => {}, + } + } + length +} + +/// Returns an iterator of [`Page`]. +pub fn array_to_pages( + primitive_array: &dyn Array, + type_: ParquetPrimitiveType, + nested: &[Nested], + options: WriteOptions, + encoding: Encoding, +) -> Result>> { + if let DataType::Dictionary(key_type, _, _) = primitive_array.data_type().to_logical_type() { + return match_integer_type!(key_type, |$T| { + dictionary::array_to_pages::<$T>( + primitive_array.as_any().downcast_ref().unwrap(), + type_, + &nested, + options, + encoding, + ) + }); + }; + + let nested = nested.to_vec(); + let primitive_array = primitive_array.to_boxed(); + + let number_of_rows = nested[0].len(); + + // note: this is not correct if the array is sliced - the estimation should happen on the + // primitive after sliced for parquet + let byte_size = estimated_bytes_size(primitive_array.as_ref()); + + const DEFAULT_PAGE_SIZE: usize = 1024 * 1024; + let max_page_size = options.data_pagesize_limit.unwrap_or(DEFAULT_PAGE_SIZE); + let max_page_size = max_page_size.min(2usize.pow(31) - 2usize.pow(25)); // allowed maximum page size + let bytes_per_row = if number_of_rows == 0 { + 0 + } else { + ((byte_size as f64) / (number_of_rows as f64)) as usize + }; + let rows_per_page = (max_page_size / (bytes_per_row + 1)).max(1); + + let pages = (0..number_of_rows) + .step_by(rows_per_page) + .map(move |offset| { + let length = if offset + rows_per_page > number_of_rows { + number_of_rows - offset + } else { + rows_per_page + }; + + let mut right_array = primitive_array.clone(); + let mut right_nested = nested.clone(); + slice_parquet_array(right_array.as_mut(), &mut right_nested, offset, length); + + array_to_page( + right_array.as_ref(), + type_.clone(), + &right_nested, + options, + encoding, + ) + }); + + Ok(DynIter::new(pages)) +} + +/// Converts an [`Array`] to a [`CompressedPage`] based on options, descriptor and `encoding`. +pub fn array_to_page( + array: &dyn Array, + type_: ParquetPrimitiveType, + nested: &[Nested], + options: WriteOptions, + encoding: Encoding, +) -> Result { + if nested.len() == 1 { + // special case where validity == def levels + return array_to_page_simple(array, type_, options, encoding); + } + array_to_page_nested(array, type_, nested, options, encoding) +} + +/// Converts an [`Array`] to a [`CompressedPage`] based on options, descriptor and `encoding`. +pub fn array_to_page_simple( + array: &dyn Array, + type_: ParquetPrimitiveType, + options: WriteOptions, + encoding: Encoding, +) -> Result { + let data_type = array.data_type(); + if !can_encode(data_type, encoding) { + return Err(Error::InvalidArgumentError(format!( + "The datatype {data_type:?} cannot be encoded by {encoding:?}" + ))); + } + + match data_type.to_logical_type() { + DataType::Boolean => { + boolean::array_to_page(array.as_any().downcast_ref().unwrap(), options, type_) + }, + // casts below MUST match the casts done at the metadata (field -> parquet type). 
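+ // For example, unsigned integers go through their signed parquet physical counterparts:
+ // UInt8, UInt16 and UInt32 are written as INT32 and UInt64 as INT64, mirroring the
+ // field-to-parquet-type mapping used when the parquet schema is built.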
+ DataType::UInt8 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::UInt16 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::UInt32 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::UInt64 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Int8 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Int16 => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Int32 | DataType::Date32 | DataType::Time32(_) => { + primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ) + }, + DataType::Int64 + | DataType::Date64 + | DataType::Time64(_) + | DataType::Timestamp(_, _) + | DataType::Duration(_) => primitive::array_to_page_integer::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Float32 => primitive::array_to_page_plain::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + ), + DataType::Float64 => primitive::array_to_page_plain::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + ), + DataType::Utf8 => utf8::array_to_page::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::LargeUtf8 => utf8::array_to_page::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Binary => binary::array_to_page::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::LargeBinary => binary::array_to_page::( + array.as_any().downcast_ref().unwrap(), + options, + type_, + encoding, + ), + DataType::Null => { + let array = Int32Array::new_null(DataType::Int32, array.len()); + primitive::array_to_page_plain::(&array, options, type_) + }, + DataType::Interval(IntervalUnit::YearMonth) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let mut values = Vec::::with_capacity(12 * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_le_bytes(); + values.extend_from_slice(bytes); + values.extend_from_slice(&[0; 8]); + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(12), + values.into(), + array.validity().cloned(), + ); + let statistics = if options.write_statistics { + Some(fixed_len_bytes::build_statistics(&array, type_.clone())) + } else { + None + }; + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + }, + DataType::Interval(IntervalUnit::DayTime) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let mut values = Vec::::with_capacity(12 * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_le_bytes(); + values.extend_from_slice(&[0; 4]); // months + values.extend_from_slice(bytes); // days and seconds + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(12), + values.into(), + array.validity().cloned(), + ); + let statistics = if options.write_statistics { + Some(fixed_len_bytes::build_statistics(&array, type_.clone())) + } else { + None + }; + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + }, + DataType::FixedSizeBinary(_) => { + let array = 
array.as_any().downcast_ref().unwrap(); + let statistics = if options.write_statistics { + Some(fixed_len_bytes::build_statistics(array, type_.clone())) + } else { + None + }; + + fixed_len_bytes::array_to_page(array, options, type_, statistics) + }, + DataType::Decimal256(precision, _) => { + let precision = *precision; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + if precision <= 9 { + let values = array + .values() + .iter() + .map(|x| x.0.as_i32()) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int32, values, array.validity().cloned()); + primitive::array_to_page_integer::(&array, options, type_, encoding) + } else if precision <= 18 { + let values = array + .values() + .iter() + .map(|x| x.0.as_i64()) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int64, values, array.validity().cloned()); + primitive::array_to_page_integer::(&array, options, type_, encoding) + } else if precision <= 38 { + let size = decimal_length_from_precision(precision); + let statistics = if options.write_statistics { + let stats = fixed_len_bytes::build_statistics_decimal256_with_i128( + array, + type_.clone(), + size, + ); + Some(stats) + } else { + None + }; + + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.0.low().to_be_bytes()[16 - size..]; + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } else { + let size = 32; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let statistics = if options.write_statistics { + let stats = + fixed_len_bytes::build_statistics_decimal256(array, type_.clone(), size); + Some(stats) + } else { + None + }; + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_be_bytes(); + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } + }, + DataType::Decimal(precision, _) => { + let precision = *precision; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + if precision <= 9 { + let values = array + .values() + .iter() + .map(|x| *x as i32) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int32, values, array.validity().cloned()); + primitive::array_to_page_integer::(&array, options, type_, encoding) + } else if precision <= 18 { + let values = array + .values() + .iter() + .map(|x| *x as i64) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int64, values, array.validity().cloned()); + primitive::array_to_page_integer::(&array, options, type_, encoding) + } else { + let size = decimal_length_from_precision(precision); + + let statistics = if options.write_statistics { + let stats = + fixed_len_bytes::build_statistics_decimal(array, type_.clone(), size); + Some(stats) + } else { + None + }; + + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_be_bytes()[16 - size..]; + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + 
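+ // Parquet DECIMAL values backed by FIXED_LEN_BYTE_ARRAY are big-endian two's complement;
+ // for precisions above 38 digits all 32 bytes of the i256 are written unchanged.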
fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } + }, + other => Err(Error::NotYetImplemented(format!( + "Writing parquet pages for data type {other:?}" + ))), + } + .map(Page::Data) +} + +fn array_to_page_nested( + array: &dyn Array, + type_: ParquetPrimitiveType, + nested: &[Nested], + options: WriteOptions, + _encoding: Encoding, +) -> Result { + use DataType::*; + match array.data_type().to_logical_type() { + Null => { + let array = Int32Array::new_null(DataType::Int32, array.len()); + primitive::nested_array_to_page::(&array, options, type_, nested) + }, + Boolean => { + let array = array.as_any().downcast_ref().unwrap(); + boolean::nested_array_to_page(array, options, type_, nested) + }, + Utf8 => { + let array = array.as_any().downcast_ref().unwrap(); + utf8::nested_array_to_page::(array, options, type_, nested) + }, + LargeUtf8 => { + let array = array.as_any().downcast_ref().unwrap(); + utf8::nested_array_to_page::(array, options, type_, nested) + }, + Binary => { + let array = array.as_any().downcast_ref().unwrap(); + binary::nested_array_to_page::(array, options, type_, nested) + }, + LargeBinary => { + let array = array.as_any().downcast_ref().unwrap(); + binary::nested_array_to_page::(array, options, type_, nested) + }, + UInt8 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + UInt16 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + UInt32 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + UInt64 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Int8 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Int16 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Int32 | Date32 | Time32(_) => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Int64 | Date64 | Time64(_) | Timestamp(_, _) | Duration(_) => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Float32 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Float64 => { + let array = array.as_any().downcast_ref().unwrap(); + primitive::nested_array_to_page::(array, options, type_, nested) + }, + Decimal(precision, _) => { + let precision = *precision; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + if precision <= 9 { + let values = array + .values() + .iter() + .map(|x| *x as i32) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int32, values, array.validity().cloned()); + primitive::nested_array_to_page::(&array, options, type_, nested) + } else if precision <= 18 { + let values = array + .values() + .iter() + .map(|x| *x as i64) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int64, values, array.validity().cloned()); + primitive::nested_array_to_page::(&array, options, type_, nested) + } else { + let size = decimal_length_from_precision(precision); + + let statistics = if options.write_statistics { + let 
stats = + fixed_len_bytes::build_statistics_decimal(array, type_.clone(), size); + Some(stats) + } else { + None + }; + + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_be_bytes()[16 - size..]; + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } + }, + Decimal256(precision, _) => { + let precision = *precision; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + if precision <= 9 { + let values = array + .values() + .iter() + .map(|x| x.0.as_i32()) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int32, values, array.validity().cloned()); + primitive::nested_array_to_page::(&array, options, type_, nested) + } else if precision <= 18 { + let values = array + .values() + .iter() + .map(|x| x.0.as_i64()) + .collect::>() + .into(); + + let array = + PrimitiveArray::::new(DataType::Int64, values, array.validity().cloned()); + primitive::nested_array_to_page::(&array, options, type_, nested) + } else if precision <= 38 { + let size = decimal_length_from_precision(precision); + let statistics = if options.write_statistics { + let stats = fixed_len_bytes::build_statistics_decimal256_with_i128( + array, + type_.clone(), + size, + ); + Some(stats) + } else { + None + }; + + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.0.low().to_be_bytes()[16 - size..]; + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } else { + let size = 32; + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let statistics = if options.write_statistics { + let stats = + fixed_len_bytes::build_statistics_decimal256(array, type_.clone(), size); + Some(stats) + } else { + None + }; + let mut values = Vec::::with_capacity(size * array.len()); + array.values().iter().for_each(|x| { + let bytes = &x.to_be_bytes(); + values.extend_from_slice(bytes) + }); + let array = FixedSizeBinaryArray::new( + DataType::FixedSizeBinary(size), + values.into(), + array.validity().cloned(), + ); + + fixed_len_bytes::array_to_page(&array, options, type_, statistics) + } + }, + other => Err(Error::NotYetImplemented(format!( + "Writing nested parquet pages for data type {other:?}" + ))), + } + .map(Page::Data) +} + +fn transverse_recursive T + Clone>( + data_type: &DataType, + map: F, + encodings: &mut Vec, +) { + use crate::datatypes::PhysicalType::*; + match data_type.to_physical_type() { + Null | Boolean | Primitive(_) | Binary | FixedSizeBinary | LargeBinary | Utf8 + | Dictionary(_) | LargeUtf8 => encodings.push(map(data_type)), + List | FixedSizeList | LargeList => { + let a = data_type.to_logical_type(); + if let DataType::List(inner) = a { + transverse_recursive(&inner.data_type, map, encodings) + } else if let DataType::LargeList(inner) = a { + transverse_recursive(&inner.data_type, map, encodings) + } else if let DataType::FixedSizeList(inner, _) = a { + transverse_recursive(&inner.data_type, map, encodings) + } else { + unreachable!() + } + }, + Struct => { + if let DataType::Struct(fields) = data_type.to_logical_type() { + for field in fields { + 
transverse_recursive(&field.data_type, map.clone(), encodings) + } + } else { + unreachable!() + } + }, + Map => { + if let DataType::Map(field, _) = data_type.to_logical_type() { + if let DataType::Struct(fields) = field.data_type.to_logical_type() { + for field in fields { + transverse_recursive(&field.data_type, map.clone(), encodings) + } + } else { + unreachable!() + } + } else { + unreachable!() + } + }, + Union => todo!(), + } +} + +/// Transverses the `data_type` up to its (parquet) columns and returns a vector of +/// items based on `map`. +/// This is used to assign an [`Encoding`] to every parquet column based on the columns' type (see example) +/// # Example +/// ``` +/// use arrow2::io::parquet::write::{transverse, Encoding}; +/// use arrow2::datatypes::{DataType, Field}; +/// +/// let dt = DataType::Struct(vec![ +/// Field::new("a", DataType::Int64, true), +/// Field::new("b", DataType::List(Box::new(Field::new("item", DataType::Int32, true))), true), +/// ]); +/// +/// let encodings = transverse(&dt, |dt| Encoding::Plain); +/// assert_eq!(encodings, vec![Encoding::Plain, Encoding::Plain]); +/// ``` +pub fn transverse T + Clone>(data_type: &DataType, map: F) -> Vec { + let mut encodings = vec![]; + transverse_recursive(data_type, map, &mut encodings); + encodings +} diff --git a/crates/nano-arrow/src/io/parquet/write/nested/def.rs b/crates/nano-arrow/src/io/parquet/write/nested/def.rs new file mode 100644 index 000000000000..02947dd5bef9 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/nested/def.rs @@ -0,0 +1,584 @@ +use super::super::pages::{ListNested, Nested}; +use super::rep::num_values; +use super::to_length; +use crate::bitmap::Bitmap; +use crate::offset::Offset; + +trait DebugIter: Iterator + std::fmt::Debug {} + +impl + std::fmt::Debug> DebugIter for A {} + +fn single_iter<'a>( + validity: &'a Option, + is_optional: bool, + length: usize, +) -> Box { + match (is_optional, validity) { + (false, _) => { + Box::new(std::iter::repeat((0u32, 1usize)).take(length)) as Box + }, + (true, None) => { + Box::new(std::iter::repeat((1u32, 1usize)).take(length)) as Box + }, + (true, Some(validity)) => { + Box::new(validity.iter().map(|v| (v as u32, 1usize)).take(length)) as Box + }, + } +} + +fn single_list_iter<'a, O: Offset>(nested: &'a ListNested) -> Box { + match (nested.is_optional, &nested.validity) { + (false, _) => Box::new( + std::iter::repeat(0u32) + .zip(to_length(&nested.offsets)) + .map(|(a, b)| (a + (b != 0) as u32, b)), + ) as Box, + (true, None) => Box::new( + std::iter::repeat(1u32) + .zip(to_length(&nested.offsets)) + .map(|(a, b)| (a + (b != 0) as u32, b)), + ) as Box, + (true, Some(validity)) => Box::new( + validity + .iter() + .map(|x| (x as u32)) + .zip(to_length(&nested.offsets)) + .map(|(a, b)| (a + (b != 0) as u32, b)), + ) as Box, + } +} + +fn iter<'a>(nested: &'a [Nested]) -> Vec> { + nested + .iter() + .map(|nested| match nested { + Nested::Primitive(validity, is_optional, length) => { + single_iter(validity, *is_optional, *length) + }, + Nested::List(nested) => single_list_iter(nested), + Nested::LargeList(nested) => single_list_iter(nested), + Nested::Struct(validity, is_optional, length) => { + single_iter(validity, *is_optional, *length) + }, + }) + .collect() +} + +/// Iterator adapter of parquet / dremel definition levels +#[derive(Debug)] +pub struct DefLevelsIter<'a> { + // iterators of validities and lengths. E.g. 
[[[None,b,c], None], None] -> [[(true, 2), (false, 0)], [(true, 3), (false, 0)], [(false, 1), (true, 1), (true, 1)]] + iter: Vec>, + // vector containing the remaining number of values of each iterator. + // e.g. the iters [[2, 2], [3, 4, 1, 2]] after the first iteration will return [2, 3], + // and remaining will be [2, 3]. + // on the second iteration, it will be `[2, 2]` (since iterations consume the last items) + remaining: Vec, /* < remaining.len() == iter.len() */ + validity: Vec, + // cache of the first `remaining` that is non-zero. Examples: + // * `remaining = [2, 2] => current_level = 2` + // * `remaining = [2, 0] => current_level = 1` + // * `remaining = [0, 0] => current_level = 0` + current_level: usize, /* < iter.len() */ + // the total definition level at any given point during the iteration + total: u32, /* < iter.len() */ + // the total number of items that this iterator will return + remaining_values: usize, +} + +impl<'a> DefLevelsIter<'a> { + pub fn new(nested: &'a [Nested]) -> Self { + let remaining_values = num_values(nested); + + let iter = iter(nested); + let remaining = vec![0; iter.len()]; + let validity = vec![0; iter.len()]; + + Self { + iter, + remaining, + validity, + total: 0, + current_level: 0, + remaining_values, + } + } +} + +impl<'a> Iterator for DefLevelsIter<'a> { + type Item = u32; + + fn next(&mut self) -> Option { + if self.remaining_values == 0 { + return None; + } + + if self.remaining.is_empty() { + self.remaining_values -= 1; + return Some(0); + } + + let mut empty_contrib = 0u32; + for ((iter, remaining), validity) in self + .iter + .iter_mut() + .zip(self.remaining.iter_mut()) + .zip(self.validity.iter_mut()) + .skip(self.current_level) + { + let (is_valid, length): (u32, usize) = iter.next()?; + *validity = is_valid; + self.total += is_valid; + + *remaining = length; + if length == 0 { + *validity = 0; + self.total -= is_valid; + empty_contrib = is_valid; + break; + } + self.current_level += 1; + } + + // track + if let Some(x) = self.remaining.get_mut(self.current_level.saturating_sub(1)) { + *x = x.saturating_sub(1) + } + + let r = Some(self.total + empty_contrib); + + for index in (1..self.current_level).rev() { + if self.remaining[index] == 0 { + self.current_level -= 1; + self.remaining[index - 1] -= 1; + self.total -= self.validity[index]; + } + } + if self.remaining[0] == 0 { + self.current_level = self.current_level.saturating_sub(1); + self.total -= self.validity[0]; + } + self.remaining_values -= 1; + r + } + + fn size_hint(&self) -> (usize, Option) { + let length = self.remaining_values; + (length, Some(length)) + } +} + +#[cfg(test)] +mod tests { + use super::*; + + fn test(nested: Vec, expected: Vec) { + let mut iter = DefLevelsIter::new(&nested); + assert_eq!(iter.size_hint().0, expected.len()); + let result = iter.by_ref().collect::>(); + assert_eq!(result, expected); + assert_eq!(iter.size_hint().0, 0); + } + + #[test] + fn struct_optional() { + let b = [ + true, false, true, true, false, true, false, false, true, true, + ]; + let nested = vec![ + Nested::Struct(None, true, 10), + Nested::Primitive(Some(b.into()), true, 10), + ]; + let expected = vec![2, 1, 2, 2, 1, 2, 1, 1, 2, 2]; + + test(nested, expected) + } + + #[test] + fn nested_edge_simple() { + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 2), + ]; + let expected = vec![3, 3]; + + test(nested, expected) + } + + #[test] + fn struct_optional_1() { + 
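+ // Same shape as `struct_optional` above: the optional struct level (no validity bitmap)
+ // always contributes one definition level and the primitive's validity contributes the
+ // second, so valid slots yield def level 2 and null slots yield 1.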
let b = [ + true, false, true, true, false, true, false, false, true, true, + ]; + let nested = vec![ + Nested::Struct(None, true, 10), + Nested::Primitive(Some(b.into()), true, 10), + ]; + let expected = vec![2, 1, 2, 2, 1, 2, 1, 1, 2, 2]; + + test(nested, expected) + } + + #[test] + fn struct_optional_optional() { + let nested = vec![ + Nested::Struct(None, true, 10), + Nested::Primitive(None, true, 10), + ]; + let expected = vec![2, 2, 2, 2, 2, 2, 2, 2, 2, 2]; + + test(nested, expected) + } + + #[test] + fn l1_required_required() { + let nested = vec![ + // [[0, 1], [], [2, 0, 3], [4, 5, 6], [], [7, 8, 9], [], [10]] + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 12), + ]; + let expected = vec![1, 1, 0, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1]; + + test(nested, expected) + } + + #[test] + fn l1_optional_optional() { + // [[0, 1], None, [2, None, 3], [4, 5, 6], [], [7, 8, 9], None, [10]] + + let v0 = [true, false, true, true, true, true, false, true]; + let v1 = [ + true, true, //[0, 1] + true, false, true, //[2, None, 3] + true, true, true, //[4, 5, 6] + true, true, true, //[7, 8, 9] + true, //[10] + ]; + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: Some(v0.into()), + }), + Nested::Primitive(Some(v1.into()), true, 12), + ]; + let expected = vec![3u32, 3, 0, 3, 2, 3, 3, 3, 3, 1, 3, 3, 3, 0, 3]; + + test(nested, expected) + } + + #[test] + fn l2_required_required_required() { + /* + [ + [ + [1,2,3], + [4,5,6,7], + ], + [ + [8], + [9, 10] + ] + ] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 2, 4].try_into().unwrap(), + validity: None, + }), + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 3, 7, 8, 10].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 10), + ]; + let expected = vec![2, 2, 2, 2, 2, 2, 2, 2, 2, 2]; + + test(nested, expected) + } + + #[test] + fn l2_optional_required_required() { + let a = [true, false, true, true]; + /* + [ + [ + [1,2,3], + [4,5,6,7], + ], + None, + [ + [8], + [], + [9, 10] + ] + ] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 2, 5].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 3, 7, 8, 8, 10].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 10), + ]; + let expected = vec![3, 3, 3, 3, 3, 3, 3, 0, 1, 3, 2, 3, 3]; + + test(nested, expected) + } + + #[test] + fn l2_optional_optional_required() { + let a = [true, false, true]; + let b = [true, true, true, true, false]; + /* + [ + [ + [1,2,3], + [4,5,6,7], + ], + None, + [ + [8], + [], + None, + ], + ] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 3, 7, 8, 8, 8].try_into().unwrap(), + validity: Some(b.into()), + }), + Nested::Primitive(None, false, 8), + ]; + let expected = vec![4, 4, 4, 4, 4, 4, 4, 0, 4, 3, 2]; + + test(nested, expected) + } + + #[test] + fn l2_optional_optional_optional() { + let a = [true, false, true]; + let b = [true, true, true, false]; + let c = [true, true, true, true, false, true, true, true]; + /* + [ + [ + [1,2,3], + [4,None,6,7], + ], + 
None, + [ + [8], + None, + ], + ] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 4].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 3, 7, 8, 8].try_into().unwrap(), + validity: Some(b.into()), + }), + Nested::Primitive(Some(c.into()), true, 8), + ]; + let expected = vec![5, 5, 5, 5, 4, 5, 5, 0, 5, 2]; + + test(nested, expected) + } + + /* + [{"a": "a"}, {"a": "b"}], + None, + [{"a": "b"}, None, {"a": "b"}], + [{"a": None}, {"a": None}, {"a": None}], + [], + [{"a": "d"}, {"a": "d"}, {"a": "d"}], + None, + [{"a": "e"}], + */ + #[test] + fn nested_list_struct_nullable() { + let a = [ + true, true, true, false, true, false, false, false, true, true, true, true, + ]; + let b = [ + true, true, true, false, true, true, true, true, true, true, true, true, + ]; + let c = [true, false, true, true, true, true, false, true]; + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: Some(c.into()), + }), + Nested::Struct(Some(b.into()), true, 12), + Nested::Primitive(Some(a.into()), true, 12), + ]; + let expected = vec![4, 4, 0, 4, 2, 4, 3, 3, 3, 1, 4, 4, 4, 0, 4]; + + test(nested, expected) + } + + #[test] + fn nested_list_struct_nullable1() { + let c = [true, false]; + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 1].try_into().unwrap(), + validity: Some(c.into()), + }), + Nested::Struct(None, true, 1), + Nested::Primitive(None, true, 1), + ]; + let expected = vec![4, 0]; + + test(nested, expected) + } + + #[test] + fn nested_struct_list_nullable() { + let a = [true, false, true, true, true, true, false, true]; + let b = [ + true, true, true, false, true, true, true, true, true, true, true, true, + ]; + let nested = vec![ + Nested::Struct(None, true, 12), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::Primitive(Some(b.into()), true, 12), + ]; + let expected = vec![4, 4, 1, 4, 3, 4, 4, 4, 4, 2, 4, 4, 4, 1, 4]; + + test(nested, expected) + } + + #[test] + fn nested_struct_list_nullable1() { + let a = [true, true, false]; + let nested = vec![ + Nested::Struct(None, true, 3), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 1, 1].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::Primitive(None, true, 1), + ]; + let expected = vec![4, 2, 1]; + + test(nested, expected) + } + + #[test] + fn nested_list_struct_list_nullable1() { + /* + [ + [{"a": ["b"]}, None], + ] + */ + + let a = [true]; + let b = [true, false]; + let c = [true, false]; + let d = [true]; + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::Struct(Some(b.into()), true, 2), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 1].try_into().unwrap(), + validity: Some(c.into()), + }), + Nested::Primitive(Some(d.into()), true, 1), + ]; + /* + 0 6 + 1 6 + 0 0 + 0 6 + 1 2 + */ + let expected = vec![6, 2]; + + test(nested, expected) + } + + #[test] + fn nested_list_struct_list_nullable() { + /* + [ + [{"a": ["a"]}, {"a": ["b"]}], + None, + [{"a": ["b"]}, None, {"a": ["b"]}], + [{"a": None}, {"a": None}, {"a": None}], + [], + [{"a": ["d"]}, {"a": [None]}, {"a": ["c", "d"]}], + None, + [{"a": []}], + ] + */ + let a = [true, 
false, true, true, true, true, false, true]; + let b = [ + true, true, true, false, true, true, true, true, true, true, true, true, + ]; + let c = [ + true, true, true, false, true, false, false, false, true, true, true, true, + ]; + let d = [true, true, true, true, true, false, true, true]; + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: Some(a.into()), + }), + Nested::Struct(Some(b.into()), true, 12), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 2, 3, 3, 4, 4, 4, 4, 5, 6, 8, 8] + .try_into() + .unwrap(), + validity: Some(c.into()), + }), + Nested::Primitive(Some(d.into()), true, 8), + ]; + let expected = vec![6, 6, 0, 6, 2, 6, 3, 3, 3, 1, 6, 5, 6, 6, 0, 4]; + + test(nested, expected) + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/nested/mod.rs b/crates/nano-arrow/src/io/parquet/write/nested/mod.rs new file mode 100644 index 000000000000..042d731c57de --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/nested/mod.rs @@ -0,0 +1,118 @@ +mod def; +mod rep; + +use parquet2::encoding::hybrid_rle::encode_u32; +use parquet2::read::levels::get_bit_width; +use parquet2::write::Version; +pub use rep::num_values; + +use super::Nested; +use crate::error::Result; +use crate::offset::Offset; + +fn write_levels_v1) -> Result<()>>( + buffer: &mut Vec, + encode: F, +) -> Result<()> { + buffer.extend_from_slice(&[0; 4]); + let start = buffer.len(); + + encode(buffer)?; + + let end = buffer.len(); + let length = end - start; + + // write the first 4 bytes as length + let length = (length as i32).to_le_bytes(); + (0..4).for_each(|i| buffer[start - 4 + i] = length[i]); + Ok(()) +} + +/// writes the rep levels to a `Vec`. +fn write_rep_levels(buffer: &mut Vec, nested: &[Nested], version: Version) -> Result<()> { + let max_level = max_rep_level(nested) as i16; + if max_level == 0 { + return Ok(()); + } + let num_bits = get_bit_width(max_level); + + let levels = rep::RepLevelsIter::new(nested); + + match version { + Version::V1 => { + write_levels_v1(buffer, |buffer: &mut Vec| { + encode_u32(buffer, levels, num_bits)?; + Ok(()) + })?; + }, + Version::V2 => { + encode_u32(buffer, levels, num_bits)?; + }, + } + + Ok(()) +} + +/// writes the rep levels to a `Vec`. 
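+/// The levels come from `DefLevelsIter` and are encoded with parquet2's hybrid
+/// RLE/bit-packing (`encode_u32`) using `get_bit_width(max_level)` bits; for V1 pages they
+/// are additionally length-prefixed by `write_levels_v1`.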
+fn write_def_levels(buffer: &mut Vec, nested: &[Nested], version: Version) -> Result<()> { + let max_level = max_def_level(nested) as i16; + if max_level == 0 { + return Ok(()); + } + let num_bits = get_bit_width(max_level); + + let levels = def::DefLevelsIter::new(nested); + + match version { + Version::V1 => write_levels_v1(buffer, move |buffer: &mut Vec| { + encode_u32(buffer, levels, num_bits)?; + Ok(()) + }), + Version::V2 => Ok(encode_u32(buffer, levels, num_bits)?), + } +} + +fn max_def_level(nested: &[Nested]) -> usize { + nested + .iter() + .map(|nested| match nested { + Nested::Primitive(_, is_optional, _) => *is_optional as usize, + Nested::List(nested) => 1 + (nested.is_optional as usize), + Nested::LargeList(nested) => 1 + (nested.is_optional as usize), + Nested::Struct(_, is_optional, _) => *is_optional as usize, + }) + .sum() +} + +fn max_rep_level(nested: &[Nested]) -> usize { + nested + .iter() + .map(|nested| match nested { + Nested::LargeList(_) | Nested::List(_) => 1, + Nested::Primitive(_, _, _) | Nested::Struct(_, _, _) => 0, + }) + .sum() +} + +fn to_length( + offsets: &[O], +) -> impl Iterator + std::fmt::Debug + Clone + '_ { + offsets + .windows(2) + .map(|w| w[1].to_usize() - w[0].to_usize()) +} + +/// Write `repetition_levels` and `definition_levels` to buffer. +pub fn write_rep_and_def( + page_version: Version, + nested: &[Nested], + buffer: &mut Vec, +) -> Result<(usize, usize)> { + write_rep_levels(buffer, nested, page_version)?; + let repetition_levels_byte_length = buffer.len(); + + write_def_levels(buffer, nested, page_version)?; + let definition_levels_byte_length = buffer.len() - repetition_levels_byte_length; + + Ok((repetition_levels_byte_length, definition_levels_byte_length)) +} diff --git a/crates/nano-arrow/src/io/parquet/write/nested/rep.rs b/crates/nano-arrow/src/io/parquet/write/nested/rep.rs new file mode 100644 index 000000000000..2bfbe1ce24f4 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/nested/rep.rs @@ -0,0 +1,370 @@ +use super::super::pages::Nested; +use super::to_length; + +trait DebugIter: Iterator + std::fmt::Debug {} + +impl + std::fmt::Debug> DebugIter for A {} + +fn iter<'a>(nested: &'a [Nested]) -> Vec> { + nested + .iter() + .filter_map(|nested| match nested { + Nested::Primitive(_, _, _) => None, + Nested::List(nested) => { + Some(Box::new(to_length(&nested.offsets)) as Box) + }, + Nested::LargeList(nested) => { + Some(Box::new(to_length(&nested.offsets)) as Box) + }, + Nested::Struct(_, _, _) => None, + }) + .collect() +} + +/// return number values of the nested +pub fn num_values(nested: &[Nested]) -> usize { + let pr = match nested.last().unwrap() { + Nested::Primitive(_, _, len) => *len, + _ => todo!(), + }; + + iter(nested) + .into_iter() + .enumerate() + .map(|(_, lengths)| { + lengths + .map(|length| if length == 0 { 1 } else { 0 }) + .sum::() + }) + .sum::() + + pr +} + +/// Iterator adapter of parquet / dremel repetition levels +#[derive(Debug)] +pub struct RepLevelsIter<'a> { + // iterators of lengths. E.g. [[[a,b,c], [d,e,f,g]], [[h], [i,j]]] -> [[2, 2], [3, 4, 1, 2]] + iter: Vec>, + // vector containing the remaining number of values of each iterator. + // e.g. the iters [[2, 2], [3, 4, 1, 2]] after the first iteration will return [2, 3], + // and remaining will be [2, 3]. + // on the second iteration, it will be `[2, 2]` (since iterations consume the last items) + remaining: Vec, /* < remaining.len() == iter.len() */ + // cache of the first `remaining` that is non-zero. 
Examples: + // * `remaining = [2, 2] => current_level = 2` + // * `remaining = [2, 0] => current_level = 1` + // * `remaining = [0, 0] => current_level = 0` + current_level: usize, /* < iter.len() */ + // the number to discount due to being the first element of the iterators. + total: usize, /* < iter.len() */ + + // the total number of items that this iterator will return + remaining_values: usize, +} + +impl<'a> RepLevelsIter<'a> { + pub fn new(nested: &'a [Nested]) -> Self { + let remaining_values = num_values(nested); + + let iter = iter(nested); + let remaining = vec![0; iter.len()]; + + Self { + iter, + remaining, + total: 0, + current_level: 0, + remaining_values, + } + } +} + +impl<'a> Iterator for RepLevelsIter<'a> { + type Item = u32; + + fn next(&mut self) -> Option { + if self.remaining_values == 0 { + return None; + } + if self.remaining.is_empty() { + self.remaining_values -= 1; + return Some(0); + } + + for (iter, remaining) in self + .iter + .iter_mut() + .zip(self.remaining.iter_mut()) + .skip(self.current_level) + { + let length: usize = iter.next()?; + *remaining = length; + if length == 0 { + break; + } + self.current_level += 1; + self.total += 1; + } + + // track + if let Some(x) = self.remaining.get_mut(self.current_level.saturating_sub(1)) { + *x = x.saturating_sub(1) + } + let r = Some((self.current_level - self.total) as u32); + + // update + for index in (1..self.current_level).rev() { + if self.remaining[index] == 0 { + self.current_level -= 1; + self.remaining[index - 1] -= 1; + } + } + if self.remaining[0] == 0 { + self.current_level = self.current_level.saturating_sub(1); + } + self.total = 0; + self.remaining_values -= 1; + + r + } + + fn size_hint(&self) -> (usize, Option) { + let length = self.remaining_values; + (length, Some(length)) + } +} + +#[cfg(test)] +mod tests { + use super::super::super::pages::ListNested; + use super::*; + + fn test(nested: Vec, expected: Vec) { + let mut iter = RepLevelsIter::new(&nested); + assert_eq!(iter.size_hint().0, expected.len()); + assert_eq!(iter.by_ref().collect::>(), expected); + assert_eq!(iter.size_hint().0, 0); + } + + #[test] + fn struct_required() { + let nested = vec![ + Nested::Struct(None, false, 10), + Nested::Primitive(None, true, 10), + ]; + let expected = vec![0, 0, 0, 0, 0, 0, 0, 0, 0, 0]; + + test(nested, expected) + } + + #[test] + fn struct_optional() { + let nested = vec![ + Nested::Struct(None, true, 10), + Nested::Primitive(None, true, 10), + ]; + let expected = vec![0, 0, 0, 0, 0, 0, 0, 0, 0, 0]; + + test(nested, expected) + } + + #[test] + fn l1() { + let nested = vec![ + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 12), + ]; + let expected = vec![0u32, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0]; + + test(nested, expected) + } + + #[test] + fn l2() { + let nested = vec![ + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 2, 2, 4].try_into().unwrap(), + validity: None, + }), + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 3, 7, 8, 10].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 10), + ]; + let expected = vec![0, 2, 2, 1, 2, 2, 2, 0, 0, 1, 2]; + + test(nested, expected) + } + + #[test] + fn list_of_struct() { + /* + [ + [{"a": "b"}],[{"a": "c"}] + ] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 2].try_into().unwrap(), + validity: None, + }), + 
Nested::Struct(None, true, 2), + Nested::Primitive(None, true, 2), + ]; + let expected = vec![0, 0]; + + test(nested, expected) + } + + #[test] + fn list_struct_list() { + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 3].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 3), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 3, 6, 7].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 7), + ]; + let expected = vec![0, 2, 2, 1, 2, 2, 0]; + + test(nested, expected) + } + + #[test] + fn struct_list_optional() { + /* + {"f1": ["a", "b", None, "c"]} + */ + let nested = vec![ + Nested::Struct(None, true, 1), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 4].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 4), + ]; + let expected = vec![0, 1, 1, 1]; + + test(nested, expected) + } + + #[test] + fn l2_other() { + let nested = vec![ + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 1, 1, 3, 5, 5, 8, 8, 9].try_into().unwrap(), + validity: None, + }), + Nested::List(ListNested { + is_optional: false, + offsets: vec![0, 2, 4, 5, 7, 8, 9, 10, 11, 12].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, false, 12), + ]; + let expected = vec![0, 2, 0, 0, 2, 1, 0, 2, 1, 0, 0, 1, 1, 0, 0]; + + test(nested, expected) + } + + #[test] + fn list_struct_list_1() { + /* + [ + [{"a": ["a"]}, {"a": ["b"]}], + [], + [{"a": ["b"]}, None, {"a": ["b"]}], + [{"a": []}, {"a": []}, {"a": []}], + [], + [{"a": ["d"]}, {"a": ["a"]}, {"a": ["c", "d"]}], + [], + [{"a": []}], + ] + // reps: [0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 2, 0, 0] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 2, 2, 5, 8, 8, 11, 11, 12].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 12), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 2, 3, 3, 4, 4, 4, 4, 5, 6, 8].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 8), + ]; + let expected = vec![0, 1, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 2, 0]; + + test(nested, expected) + } + + #[test] + fn list_struct_list_2() { + /* + [ + [{"a": []}], + ] + // reps: [0] + */ + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 12), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 0].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 0), + ]; + let expected = vec![0]; + + test(nested, expected) + } + + #[test] + fn list_struct_list_3() { + let nested = vec![ + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 1, 1].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 12), + Nested::List(ListNested { + is_optional: true, + offsets: vec![0, 0].try_into().unwrap(), + validity: None, + }), + Nested::Primitive(None, true, 0), + ]; + let expected = vec![0, 0]; + // [1, 0], [0] + // pick last + + test(nested, expected) + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/pages.rs b/crates/nano-arrow/src/io/parquet/write/pages.rs new file mode 100644 index 000000000000..ce51bcdcda89 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/pages.rs @@ -0,0 +1,633 @@ +use std::fmt::Debug; + +use parquet2::page::Page; +use parquet2::schema::types::{ParquetType, PrimitiveType as ParquetPrimitiveType}; +use 
parquet2::write::DynIter; + +use super::{array_to_pages, Encoding, WriteOptions}; +use crate::array::{Array, ListArray, MapArray, StructArray}; +use crate::bitmap::Bitmap; +use crate::datatypes::PhysicalType; +use crate::error::{Error, Result}; +use crate::io::parquet::read::schema::is_nullable; +use crate::offset::{Offset, OffsetsBuffer}; + +#[derive(Debug, Clone, PartialEq)] +pub struct ListNested { + pub is_optional: bool, + pub offsets: OffsetsBuffer, + pub validity: Option, +} + +impl ListNested { + pub fn new(offsets: OffsetsBuffer, validity: Option, is_optional: bool) -> Self { + Self { + is_optional, + offsets, + validity, + } + } +} + +/// Descriptor of nested information of a field +#[derive(Debug, Clone, PartialEq)] +pub enum Nested { + /// a primitive (leaf or parquet column) + /// bitmap, _, length + Primitive(Option, bool, usize), + /// a list + List(ListNested), + /// a list + LargeList(ListNested), + /// a struct + Struct(Option, bool, usize), +} + +impl Nested { + /// Returns the length (number of rows) of the element + pub fn len(&self) -> usize { + match self { + Nested::Primitive(_, _, length) => *length, + Nested::List(nested) => nested.offsets.len_proxy(), + Nested::LargeList(nested) => nested.offsets.len_proxy(), + Nested::Struct(_, _, len) => *len, + } + } +} + +/// Constructs the necessary `Vec>` to write the rep and def levels of `array` to parquet +pub fn to_nested(array: &dyn Array, type_: &ParquetType) -> Result>> { + let mut nested = vec![]; + + to_nested_recursive(array, type_, &mut nested, vec![])?; + Ok(nested) +} + +fn to_nested_recursive( + array: &dyn Array, + type_: &ParquetType, + nested: &mut Vec>, + mut parents: Vec, +) -> Result<()> { + let is_optional = is_nullable(type_.get_field_info()); + + use PhysicalType::*; + match array.data_type().to_physical_type() { + Struct => { + let array = array.as_any().downcast_ref::().unwrap(); + let fields = if let ParquetType::GroupType { fields, .. } = type_ { + fields + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a struct array".to_string(), + )); + }; + + parents.push(Nested::Struct( + array.validity().cloned(), + is_optional, + array.len(), + )); + + for (type_, array) in fields.iter().zip(array.values()) { + to_nested_recursive(array.as_ref(), type_, nested, parents.clone())?; + } + }, + List => { + let array = array.as_any().downcast_ref::>().unwrap(); + let type_ = if let ParquetType::GroupType { fields, .. } = type_ { + if let ParquetType::GroupType { fields, .. } = &fields[0] { + &fields[0] + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a list array".to_string(), + )); + } + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a list array".to_string(), + )); + }; + + parents.push(Nested::List(ListNested::new( + array.offsets().clone(), + array.validity().cloned(), + is_optional, + ))); + to_nested_recursive(array.values().as_ref(), type_, nested, parents)?; + }, + LargeList => { + let array = array.as_any().downcast_ref::>().unwrap(); + let type_ = if let ParquetType::GroupType { fields, .. } = type_ { + if let ParquetType::GroupType { fields, .. 
} = &fields[0] { + &fields[0] + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a list array".to_string(), + )); + } + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a list array".to_string(), + )); + }; + + parents.push(Nested::LargeList(ListNested::new( + array.offsets().clone(), + array.validity().cloned(), + is_optional, + ))); + to_nested_recursive(array.values().as_ref(), type_, nested, parents)?; + }, + Map => { + let array = array.as_any().downcast_ref::().unwrap(); + let type_ = if let ParquetType::GroupType { fields, .. } = type_ { + if let ParquetType::GroupType { fields, .. } = &fields[0] { + &fields[0] + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a map array".to_string(), + )); + } + } else { + return Err(Error::InvalidArgumentError( + "Parquet type must be a group for a map array".to_string(), + )); + }; + + parents.push(Nested::List(ListNested::new( + array.offsets().clone(), + array.validity().cloned(), + is_optional, + ))); + to_nested_recursive(array.field().as_ref(), type_, nested, parents)?; + }, + _ => { + parents.push(Nested::Primitive( + array.validity().cloned(), + is_optional, + array.len(), + )); + nested.push(parents) + }, + } + Ok(()) +} + +/// Convert [`Array`] to `Vec<&dyn Array>` leaves in DFS order. +pub fn to_leaves(array: &dyn Array) -> Vec<&dyn Array> { + let mut leaves = vec![]; + to_leaves_recursive(array, &mut leaves); + leaves +} + +fn to_leaves_recursive<'a>(array: &'a dyn Array, leaves: &mut Vec<&'a dyn Array>) { + use PhysicalType::*; + match array.data_type().to_physical_type() { + Struct => { + let array = array.as_any().downcast_ref::().unwrap(); + array + .values() + .iter() + .for_each(|a| to_leaves_recursive(a.as_ref(), leaves)); + }, + List => { + let array = array.as_any().downcast_ref::>().unwrap(); + to_leaves_recursive(array.values().as_ref(), leaves); + }, + LargeList => { + let array = array.as_any().downcast_ref::>().unwrap(); + to_leaves_recursive(array.values().as_ref(), leaves); + }, + Map => { + let array = array.as_any().downcast_ref::().unwrap(); + to_leaves_recursive(array.field().as_ref(), leaves); + }, + Null | Boolean | Primitive(_) | Binary | FixedSizeBinary | LargeBinary | Utf8 + | LargeUtf8 | Dictionary(_) => leaves.push(array), + other => todo!("Writing {:?} to parquet not yet implemented", other), + } +} + +/// Convert `ParquetType` to `Vec` leaves in DFS order. +pub fn to_parquet_leaves(type_: ParquetType) -> Vec { + let mut leaves = vec![]; + to_parquet_leaves_recursive(type_, &mut leaves); + leaves +} + +fn to_parquet_leaves_recursive(type_: ParquetType, leaves: &mut Vec) { + match type_ { + ParquetType::PrimitiveType(primitive) => leaves.push(primitive), + ParquetType::GroupType { fields, .. 
} => { + fields + .into_iter() + .for_each(|type_| to_parquet_leaves_recursive(type_, leaves)); + }, + } +} + +/// Returns a vector of iterators of [`Page`], one per leaf column in the array +pub fn array_to_columns + Send + Sync>( + array: A, + type_: ParquetType, + options: WriteOptions, + encoding: &[Encoding], +) -> Result>>> { + let array = array.as_ref(); + let nested = to_nested(array, &type_)?; + + let types = to_parquet_leaves(type_); + + let values = to_leaves(array); + + assert_eq!(encoding.len(), types.len()); + + values + .iter() + .zip(nested) + .zip(types) + .zip(encoding.iter()) + .map(|(((values, nested), type_), encoding)| { + array_to_pages(*values, type_, &nested, options, *encoding) + }) + .collect() +} + +#[cfg(test)] +mod tests { + use parquet2::schema::types::{GroupLogicalType, PrimitiveConvertedType, PrimitiveLogicalType}; + use parquet2::schema::Repetition; + + use super::super::{FieldInfo, ParquetPhysicalType, ParquetPrimitiveType}; + use super::*; + use crate::array::*; + use crate::bitmap::Bitmap; + use crate::datatypes::*; + + #[test] + fn test_struct() { + let boolean = BooleanArray::from_slice([false, false, true, true]).boxed(); + let int = Int32Array::from_slice([42, 28, 19, 31]).boxed(); + + let fields = vec![ + Field::new("b", DataType::Boolean, false), + Field::new("c", DataType::Int32, false), + ]; + + let array = StructArray::new( + DataType::Struct(fields), + vec![boolean.clone(), int.clone()], + Some(Bitmap::from([true, true, false, true])), + ); + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "a".to_string(), + repetition: Repetition::Optional, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![ + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "b".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Boolean, + }), + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "c".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Int32, + }), + ], + }; + let a = to_nested(&array, &type_).unwrap(); + + assert_eq!( + a, + vec![ + vec![ + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + vec![ + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + ] + ); + } + + #[test] + fn test_struct_struct() { + let boolean = BooleanArray::from_slice([false, false, true, true]).boxed(); + let int = Int32Array::from_slice([42, 28, 19, 31]).boxed(); + + let fields = vec![ + Field::new("b", DataType::Boolean, false), + Field::new("c", DataType::Int32, false), + ]; + + let array = StructArray::new( + DataType::Struct(fields), + vec![boolean.clone(), int.clone()], + Some(Bitmap::from([true, true, false, true])), + ); + + let fields = vec![ + Field::new("b", array.data_type().clone(), true), + Field::new("c", array.data_type().clone(), true), + ]; + + let array = StructArray::new( + DataType::Struct(fields), + vec![Box::new(array.clone()), Box::new(array)], + None, + ); + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "a".to_string(), + repetition: Repetition::Optional, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![ + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: 
FieldInfo { + name: "b".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Boolean, + }), + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "c".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Int32, + }), + ], + }; + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "a".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![type_.clone(), type_], + }; + + let a = to_nested(&array, &type_).unwrap(); + + assert_eq!( + a, + vec![ + // a.b.b + vec![ + Nested::Struct(None, false, 4), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + // a.b.c + vec![ + Nested::Struct(None, false, 4), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + // a.c.b + vec![ + Nested::Struct(None, false, 4), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + // a.c.c + vec![ + Nested::Struct(None, false, 4), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + ] + ); + } + + #[test] + fn test_list_struct() { + let boolean = BooleanArray::from_slice([false, false, true, true]).boxed(); + let int = Int32Array::from_slice([42, 28, 19, 31]).boxed(); + + let fields = vec![ + Field::new("b", DataType::Boolean, false), + Field::new("c", DataType::Int32, false), + ]; + + let array = StructArray::new( + DataType::Struct(fields), + vec![boolean.clone(), int.clone()], + Some(Bitmap::from([true, true, false, true])), + ); + + let array = ListArray::new( + DataType::List(Box::new(Field::new("l", array.data_type().clone(), true))), + vec![0i32, 2, 4].try_into().unwrap(), + Box::new(array), + None, + ); + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "a".to_string(), + repetition: Repetition::Optional, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![ + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "b".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Boolean, + }), + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "c".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Int32, + }), + ], + }; + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "l".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![ParquetType::GroupType { + field_info: FieldInfo { + name: "list".to_string(), + repetition: Repetition::Repeated, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![type_], + }], + }; + + let a = to_nested(&array, &type_).unwrap(); + + assert_eq!( + a, + vec![ + vec![ + Nested::List(ListNested:: { + is_optional: false, + offsets: vec![0, 2, 4].try_into().unwrap(), + validity: None, + }), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + 
vec![ + Nested::List(ListNested:: { + is_optional: false, + offsets: vec![0, 2, 4].try_into().unwrap(), + validity: None, + }), + Nested::Struct(Some(Bitmap::from([true, true, false, true])), true, 4), + Nested::Primitive(None, false, 4), + ], + ] + ); + } + + #[test] + fn test_map() { + let kv_type = DataType::Struct(vec![ + Field::new("k", DataType::Utf8, false), + Field::new("v", DataType::Int32, false), + ]); + let kv_field = Field::new("kv", kv_type.clone(), false); + let map_type = DataType::Map(Box::new(kv_field), false); + + let key_array = Utf8Array::::from_slice(["k1", "k2", "k3", "k4", "k5", "k6"]).boxed(); + let val_array = Int32Array::from_slice([42, 28, 19, 31, 21, 17]).boxed(); + let kv_array = StructArray::try_new(kv_type, vec![key_array, val_array], None) + .unwrap() + .boxed(); + let offsets = OffsetsBuffer::try_from(vec![0, 2, 3, 4, 6]).unwrap(); + + let array = MapArray::try_new(map_type, offsets, kv_array, None).unwrap(); + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "kv".to_string(), + repetition: Repetition::Optional, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![ + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "k".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: Some(PrimitiveLogicalType::String), + converted_type: Some(PrimitiveConvertedType::Utf8), + physical_type: ParquetPhysicalType::ByteArray, + }), + ParquetType::PrimitiveType(ParquetPrimitiveType { + field_info: FieldInfo { + name: "v".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: None, + converted_type: None, + physical_type: ParquetPhysicalType::Int32, + }), + ], + }; + + let type_ = ParquetType::GroupType { + field_info: FieldInfo { + name: "m".to_string(), + repetition: Repetition::Required, + id: None, + }, + logical_type: Some(GroupLogicalType::Map), + converted_type: None, + fields: vec![ParquetType::GroupType { + field_info: FieldInfo { + name: "map".to_string(), + repetition: Repetition::Repeated, + id: None, + }, + logical_type: None, + converted_type: None, + fields: vec![type_], + }], + }; + + let a = to_nested(&array, &type_).unwrap(); + + assert_eq!( + a, + vec![ + vec![ + Nested::List(ListNested:: { + is_optional: false, + offsets: vec![0, 2, 3, 4, 6].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 6), + Nested::Primitive(None, false, 6), + ], + vec![ + Nested::List(ListNested:: { + is_optional: false, + offsets: vec![0, 2, 3, 4, 6].try_into().unwrap(), + validity: None, + }), + Nested::Struct(None, true, 6), + Nested::Primitive(None, false, 6), + ], + ] + ); + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/primitive/basic.rs b/crates/nano-arrow/src/io/parquet/write/primitive/basic.rs new file mode 100644 index 000000000000..14d5f9077b49 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/primitive/basic.rs @@ -0,0 +1,192 @@ +use parquet2::encoding::delta_bitpacked::encode; +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{serialize_statistics, PrimitiveStatistics}; +use parquet2::types::NativeType as ParquetNativeType; + +use super::super::{utils, WriteOptions}; +use crate::array::{Array, PrimitiveArray}; +use crate::error::Error; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::utils::ExactSizedIter; +use crate::types::NativeType; + +pub(crate) fn encode_plain( + 
+    array: &PrimitiveArray<T>,
+    is_optional: bool,
+    mut buffer: Vec<u8>,
+) -> Vec<u8>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    T: num_traits::AsPrimitive<P>,
+{
+    if is_optional {
+        buffer.reserve(std::mem::size_of::<P>() * (array.len() - array.null_count()));
+        // append the non-null values
+        array.iter().for_each(|x| {
+            if let Some(x) = x {
+                let parquet_native: P = x.as_();
+                buffer.extend_from_slice(parquet_native.to_le_bytes().as_ref())
+            }
+        });
+    } else {
+        buffer.reserve(std::mem::size_of::<P>() * array.len());
+        // append all values
+        array.values().iter().for_each(|x| {
+            let parquet_native: P = x.as_();
+            buffer.extend_from_slice(parquet_native.to_le_bytes().as_ref())
+        });
+    }
+    buffer
+}
+
+pub(crate) fn encode_delta<T, P>(
+    array: &PrimitiveArray<T>,
+    is_optional: bool,
+    mut buffer: Vec<u8>,
+) -> Vec<u8>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    T: num_traits::AsPrimitive<P>,
+    P: num_traits::AsPrimitive<i64>,
+{
+    if is_optional {
+        // append the non-null values
+        let iterator = array.iter().flatten().map(|x| {
+            let parquet_native: P = x.as_();
+            let integer: i64 = parquet_native.as_();
+            integer
+        });
+        let iterator = ExactSizedIter::new(iterator, array.len() - array.null_count());
+        encode(iterator, &mut buffer)
+    } else {
+        // append all values
+        let iterator = array.values().iter().map(|x| {
+            let parquet_native: P = x.as_();
+            let integer: i64 = parquet_native.as_();
+            integer
+        });
+        encode(iterator, &mut buffer)
+    }
+    buffer
+}
+
+pub fn array_to_page_plain<T, P>(
+    array: &PrimitiveArray<T>,
+    options: WriteOptions,
+    type_: PrimitiveType,
+) -> Result<DataPage>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    T: num_traits::AsPrimitive<P>,
+{
+    array_to_page(array, options, type_, Encoding::Plain, encode_plain)
+}
+
+pub fn array_to_page_integer<T, P>(
+    array: &PrimitiveArray<T>,
+    options: WriteOptions,
+    type_: PrimitiveType,
+    encoding: Encoding,
+) -> Result<DataPage>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    T: num_traits::AsPrimitive<P>,
+    P: num_traits::AsPrimitive<i64>,
+{
+    match encoding {
+        Encoding::DeltaBinaryPacked => array_to_page(array, options, type_, encoding, encode_delta),
+        Encoding::Plain => array_to_page(array, options, type_, encoding, encode_plain),
+        other => Err(Error::nyi(format!("Encoding integer as {other:?}"))),
+    }
+}
+
+pub fn array_to_page<T, P, F: Fn(&PrimitiveArray<T>, bool, Vec<u8>) -> Vec<u8>>(
+    array: &PrimitiveArray<T>,
+    options: WriteOptions,
+    type_: PrimitiveType,
+    encoding: Encoding,
+    encode: F,
+) -> Result<DataPage>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    // constraint required to build statistics
+    T: num_traits::AsPrimitive<P>,
+{
+    let is_optional = is_nullable(&type_.field_info);
+
+    let validity = array.validity();
+
+    let mut buffer = vec![];
+    utils::write_def_levels(
+        &mut buffer,
+        is_optional,
+        validity,
+        array.len(),
+        options.version,
+    )?;
+
+    let definition_levels_byte_length = buffer.len();
+
+    let buffer = encode(array, is_optional, buffer);
+
+    let statistics = if options.write_statistics {
+        Some(serialize_statistics(&build_statistics(
+            array,
+            type_.clone(),
+        )))
+    } else {
+        None
+    };
+
+    utils::build_plain_page(
+        buffer,
+        array.len(),
+        array.len(),
+        array.null_count(),
+        0,
+        definition_levels_byte_length,
+        statistics,
+        type_,
+        options,
+        encoding,
+    )
+}
+
+pub fn build_statistics<T, P>(
+    array: &PrimitiveArray<T>,
+    primitive_type: PrimitiveType,
+) -> PrimitiveStatistics<P>
+where
+    T: NativeType,
+    P: ParquetNativeType,
+    T: num_traits::AsPrimitive<P>,
+{
+    PrimitiveStatistics::<P>
{ + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .map(|x| { + let x: P = x.as_(); + x + }) + .max_by(|x, y| x.ord(y)), + min_value: array + .iter() + .flatten() + .map(|x| { + let x: P = x.as_(); + x + }) + .min_by(|x, y| x.ord(y)), + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/primitive/mod.rs b/crates/nano-arrow/src/io/parquet/write/primitive/mod.rs new file mode 100644 index 000000000000..96318ab0a89b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/primitive/mod.rs @@ -0,0 +1,6 @@ +mod basic; +mod nested; + +pub use basic::{array_to_page_integer, array_to_page_plain}; +pub(crate) use basic::{build_statistics, encode_plain}; +pub use nested::array_to_page as nested_array_to_page; diff --git a/crates/nano-arrow/src/io/parquet/write/primitive/nested.rs b/crates/nano-arrow/src/io/parquet/write/primitive/nested.rs new file mode 100644 index 000000000000..fe859013c96b --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/primitive/nested.rs @@ -0,0 +1,56 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::serialize_statistics; +use parquet2::types::NativeType; + +use super::super::{nested, utils, WriteOptions}; +use super::basic::{build_statistics, encode_plain}; +use crate::array::{Array, PrimitiveArray}; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::Nested; +use crate::types::NativeType as ArrowNativeType; + +pub fn array_to_page( + array: &PrimitiveArray, + options: WriteOptions, + type_: PrimitiveType, + nested: &[Nested], +) -> Result +where + T: ArrowNativeType, + R: NativeType, + T: num_traits::AsPrimitive, +{ + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + + let (repetition_levels_byte_length, definition_levels_byte_length) = + nested::write_rep_and_def(options.version, nested, &mut buffer)?; + + let buffer = encode_plain(array, is_optional, buffer); + + let statistics = if options.write_statistics { + Some(serialize_statistics(&build_statistics( + array, + type_.clone(), + ))) + } else { + None + }; + + utils::build_plain_page( + buffer, + nested::num_values(nested), + nested[0].len(), + array.null_count(), + repetition_levels_byte_length, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::Plain, + ) +} diff --git a/crates/nano-arrow/src/io/parquet/write/row_group.rs b/crates/nano-arrow/src/io/parquet/write/row_group.rs new file mode 100644 index 000000000000..d281b63cebda --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/row_group.rs @@ -0,0 +1,126 @@ +use parquet2::error::Error as ParquetError; +use parquet2::schema::types::ParquetType; +use parquet2::write::Compressor; +use parquet2::FallibleStreamingIterator; + +use super::{ + array_to_columns, to_parquet_schema, DynIter, DynStreamingIterator, Encoding, RowGroupIter, + SchemaDescriptor, WriteOptions, +}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::{Error, Result}; + +/// Maps a [`Chunk`] and parquet-specific options to an [`RowGroupIter`] used to +/// write to parquet +/// # Panics +/// Iff +/// * `encodings.len() != fields.len()` or +/// * `encodings.len() != chunk.arrays().len()` +pub fn row_group_iter + 'static + Send + Sync>( + chunk: Chunk, + encodings: Vec>, + fields: Vec, + options: WriteOptions, +) -> RowGroupIter<'static, Error> 
{ + assert_eq!(encodings.len(), fields.len()); + assert_eq!(encodings.len(), chunk.arrays().len()); + DynIter::new( + chunk + .into_arrays() + .into_iter() + .zip(fields) + .zip(encodings) + .flat_map(move |((array, type_), encoding)| { + let encoded_columns = array_to_columns(array, type_, options, &encoding).unwrap(); + encoded_columns + .into_iter() + .map(|encoded_pages| { + let pages = encoded_pages; + + let pages = DynIter::new( + pages + .into_iter() + .map(|x| x.map_err(|e| ParquetError::OutOfSpec(e.to_string()))), + ); + + let compressed_pages = Compressor::new(pages, options.compression, vec![]) + .map_err(Error::from); + Ok(DynStreamingIterator::new(compressed_pages)) + }) + .collect::>() + }), + ) +} + +/// An iterator adapter that converts an iterator over [`Chunk`] into an iterator +/// of row groups. +/// Use it to create an iterator consumable by the parquet's API. +pub struct RowGroupIterator + 'static, I: Iterator>>> { + iter: I, + options: WriteOptions, + parquet_schema: SchemaDescriptor, + encodings: Vec>, +} + +impl + 'static, I: Iterator>>> RowGroupIterator { + /// Creates a new [`RowGroupIterator`] from an iterator over [`Chunk`]. + /// + /// # Errors + /// Iff + /// * the Arrow schema can't be converted to a valid Parquet schema. + /// * the length of the encodings is different from the number of fields in schema + pub fn try_new( + iter: I, + schema: &Schema, + options: WriteOptions, + encodings: Vec>, + ) -> Result { + if encodings.len() != schema.fields.len() { + return Err(Error::InvalidArgumentError( + "The number of encodings must equal the number of fields".to_string(), + )); + } + let parquet_schema = to_parquet_schema(schema)?; + + Ok(Self { + iter, + options, + parquet_schema, + encodings, + }) + } + + /// Returns the [`SchemaDescriptor`] of the [`RowGroupIterator`]. 
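+ /// # Example
+ /// A minimal end-to-end sketch, assuming a `FileWriter` re-export alongside the option
+ /// types used in the `FileSink` example; it drains the iterator into an in-memory buffer.
+ /// ```
+ /// # fn main() -> arrow2::error::Result<()> {
+ /// use arrow2::array::Int32Array;
+ /// use arrow2::chunk::Chunk;
+ /// use arrow2::datatypes::{DataType, Field, Schema};
+ /// use arrow2::io::parquet::write::{
+ ///     CompressionOptions, Encoding, FileWriter, RowGroupIterator, Version, WriteOptions,
+ /// };
+ ///
+ /// let schema = Schema::from(vec![Field::new("values", DataType::Int32, true)]);
+ /// let options = WriteOptions {
+ ///     write_statistics: true,
+ ///     compression: CompressionOptions::Uncompressed,
+ ///     version: Version::V2,
+ ///     data_pagesize_limit: None,
+ /// };
+ ///
+ /// let chunk = Chunk::new(vec![Int32Array::from(&[Some(1), None, Some(3)]).boxed()]);
+ /// let row_groups = RowGroupIterator::try_new(
+ ///     vec![Ok(chunk)].into_iter(),
+ ///     &schema,
+ ///     options,
+ ///     vec![vec![Encoding::Plain]],
+ /// )?;
+ /// assert_eq!(row_groups.parquet_schema().fields().len(), 1);
+ ///
+ /// let mut buffer = vec![];
+ /// let mut writer = FileWriter::try_new(&mut buffer, schema, options)?;
+ /// for group in row_groups {
+ ///     writer.write(group?)?;
+ /// }
+ /// let _size = writer.end(None)?;
+ /// # Ok(())
+ /// # }
+ /// ```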
+ pub fn parquet_schema(&self) -> &SchemaDescriptor { + &self.parquet_schema + } +} + +impl + 'static + Send + Sync, I: Iterator>>> Iterator + for RowGroupIterator +{ + type Item = Result>; + + fn next(&mut self) -> Option { + let options = self.options; + + self.iter.next().map(|maybe_chunk| { + let chunk = maybe_chunk?; + if self.encodings.len() != chunk.arrays().len() { + return Err(Error::InvalidArgumentError( + "The number of arrays in the chunk must equal the number of fields in the schema" + .to_string(), + )); + }; + let encodings = self.encodings.clone(); + Ok(row_group_iter( + chunk, + encodings, + self.parquet_schema.fields().to_vec(), + options, + )) + }) + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/schema.rs b/crates/nano-arrow/src/io/parquet/write/schema.rs new file mode 100644 index 000000000000..6f3ade5d46b3 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/schema.rs @@ -0,0 +1,379 @@ +use base64::engine::general_purpose; +use base64::Engine as _; +use parquet2::metadata::KeyValue; +use parquet2::schema::types::{ + GroupConvertedType, GroupLogicalType, IntegerType, ParquetType, PhysicalType, + PrimitiveConvertedType, PrimitiveLogicalType, TimeUnit as ParquetTimeUnit, +}; +use parquet2::schema::Repetition; + +use super::super::ARROW_SCHEMA_META_KEY; +use crate::datatypes::{DataType, Field, Schema, TimeUnit}; +use crate::error::{Error, Result}; +use crate::io::ipc::write::{default_ipc_fields, schema_to_bytes}; +use crate::io::parquet::write::decimal_length_from_precision; + +pub fn schema_to_metadata_key(schema: &Schema) -> KeyValue { + let serialized_schema = schema_to_bytes(schema, &default_ipc_fields(&schema.fields)); + + // manually prepending the length to the schema as arrow uses the legacy IPC format + // TODO: change after addressing ARROW-9777 + let schema_len = serialized_schema.len(); + let mut len_prefix_schema = Vec::with_capacity(schema_len + 8); + len_prefix_schema.extend_from_slice(&[255u8, 255, 255, 255]); + len_prefix_schema.extend_from_slice(&(schema_len as u32).to_le_bytes()); + len_prefix_schema.extend_from_slice(&serialized_schema); + + let encoded = general_purpose::STANDARD.encode(&len_prefix_schema); + + KeyValue { + key: ARROW_SCHEMA_META_KEY.to_string(), + value: Some(encoded), + } +} + +/// Creates a [`ParquetType`] from a [`Field`]. +pub fn to_parquet_type(field: &Field) -> Result { + let name = field.name.clone(); + let repetition = if field.is_nullable { + Repetition::Optional + } else { + Repetition::Required + }; + // create type from field + match field.data_type().to_logical_type() { + DataType::Null => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + None, + Some(PrimitiveLogicalType::Unknown), + None, + )?), + DataType::Boolean => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Boolean, + repetition, + None, + None, + None, + )?), + DataType::Int32 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + None, + None, + None, + )?), + // DataType::Duration(_) has no parquet representation => do not apply any logical type + DataType::Int64 | DataType::Duration(_) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + None, + None, + None, + )?), + // no natural representation in parquet; leave it as is. + // arrow consumers MAY use the arrow schema in the metadata to parse them. 
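+ // (For example, Date64 below is written as a plain Int64 column; a reader that honours
+ // the `ARROW_SCHEMA_META_KEY` footer entry written by `schema_to_metadata_key` can still
+ // recover the original Date64 type.)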
+ DataType::Date64 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + None, + None, + None, + )?), + DataType::Float32 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Float, + repetition, + None, + None, + None, + )?), + DataType::Float64 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Double, + repetition, + None, + None, + None, + )?), + DataType::Binary | DataType::LargeBinary => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::ByteArray, + repetition, + None, + None, + None, + )?), + DataType::Utf8 | DataType::LargeUtf8 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::ByteArray, + repetition, + Some(PrimitiveConvertedType::Utf8), + Some(PrimitiveLogicalType::String), + None, + )?), + DataType::Date32 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Date), + Some(PrimitiveLogicalType::Date), + None, + )?), + DataType::Int8 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Int8), + Some(PrimitiveLogicalType::Integer(IntegerType::Int8)), + None, + )?), + DataType::Int16 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Int16), + Some(PrimitiveLogicalType::Integer(IntegerType::Int16)), + None, + )?), + DataType::UInt8 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Uint8), + Some(PrimitiveLogicalType::Integer(IntegerType::UInt8)), + None, + )?), + DataType::UInt16 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Uint16), + Some(PrimitiveLogicalType::Integer(IntegerType::UInt16)), + None, + )?), + DataType::UInt32 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Uint32), + Some(PrimitiveLogicalType::Integer(IntegerType::UInt32)), + None, + )?), + DataType::UInt64 => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + Some(PrimitiveConvertedType::Uint64), + Some(PrimitiveLogicalType::Integer(IntegerType::UInt64)), + None, + )?), + // no natural representation in parquet; leave it as is. + // arrow consumers MAY use the arrow schema in the metadata to parse them. + DataType::Timestamp(TimeUnit::Second, _) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + None, + None, + None, + )?), + DataType::Timestamp(time_unit, zone) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + None, + Some(PrimitiveLogicalType::Timestamp { + is_adjusted_to_utc: matches!(zone, Some(z) if !z.as_str().is_empty()), + unit: match time_unit { + TimeUnit::Second => unreachable!(), + TimeUnit::Millisecond => ParquetTimeUnit::Milliseconds, + TimeUnit::Microsecond => ParquetTimeUnit::Microseconds, + TimeUnit::Nanosecond => ParquetTimeUnit::Nanoseconds, + }, + }), + None, + )?), + // no natural representation in parquet; leave it as is. + // arrow consumers MAY use the arrow schema in the metadata to parse them. 
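+ // (Parquet's Time/Timestamp logical types only define millisecond, microsecond and
+ // nanosecond units, so second-resolution values below are written as plain Int32/Int64
+ // without a logical type.)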
+ DataType::Time32(TimeUnit::Second) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + None, + None, + None, + )?), + DataType::Time32(TimeUnit::Millisecond) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::TimeMillis), + Some(PrimitiveLogicalType::Time { + is_adjusted_to_utc: false, + unit: ParquetTimeUnit::Milliseconds, + }), + None, + )?), + DataType::Time64(time_unit) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + match time_unit { + TimeUnit::Microsecond => Some(PrimitiveConvertedType::TimeMicros), + TimeUnit::Nanosecond => None, + _ => unreachable!(), + }, + Some(PrimitiveLogicalType::Time { + is_adjusted_to_utc: false, + unit: match time_unit { + TimeUnit::Microsecond => ParquetTimeUnit::Microseconds, + TimeUnit::Nanosecond => ParquetTimeUnit::Nanoseconds, + _ => unreachable!(), + }, + }), + None, + )?), + DataType::Struct(fields) => { + if fields.is_empty() { + return Err(Error::InvalidArgumentError( + "Parquet does not support writing empty structs".to_string(), + )); + } + // recursively convert children to types/nodes + let fields = fields + .iter() + .map(to_parquet_type) + .collect::>>()?; + Ok(ParquetType::from_group( + name, repetition, None, None, fields, None, + )) + }, + DataType::Dictionary(_, value, _) => { + let dict_field = Field::new(name.as_str(), value.as_ref().clone(), field.is_nullable); + to_parquet_type(&dict_field) + }, + DataType::FixedSizeBinary(size) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::FixedLenByteArray(*size), + repetition, + None, + None, + None, + )?), + DataType::Decimal(precision, scale) => { + let precision = *precision; + let scale = *scale; + let logical_type = Some(PrimitiveLogicalType::Decimal(precision, scale)); + + let physical_type = if precision <= 9 { + PhysicalType::Int32 + } else if precision <= 18 { + PhysicalType::Int64 + } else { + let len = decimal_length_from_precision(precision); + PhysicalType::FixedLenByteArray(len) + }; + Ok(ParquetType::try_from_primitive( + name, + physical_type, + repetition, + Some(PrimitiveConvertedType::Decimal(precision, scale)), + logical_type, + None, + )?) + }, + DataType::Decimal256(precision, scale) => { + let precision = *precision; + let scale = *scale; + let logical_type = Some(PrimitiveLogicalType::Decimal(precision, scale)); + + if precision <= 9 { + Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int32, + repetition, + Some(PrimitiveConvertedType::Decimal(precision, scale)), + logical_type, + None, + )?) + } else if precision <= 18 { + Ok(ParquetType::try_from_primitive( + name, + PhysicalType::Int64, + repetition, + Some(PrimitiveConvertedType::Decimal(precision, scale)), + logical_type, + None, + )?) + } else if precision <= 38 { + let len = decimal_length_from_precision(precision); + Ok(ParquetType::try_from_primitive( + name, + PhysicalType::FixedLenByteArray(len), + repetition, + Some(PrimitiveConvertedType::Decimal(precision, scale)), + logical_type, + None, + )?) + } else { + Ok(ParquetType::try_from_primitive( + name, + PhysicalType::FixedLenByteArray(32), + repetition, + None, + None, + None, + )?) 
+ } + }, + DataType::Interval(_) => Ok(ParquetType::try_from_primitive( + name, + PhysicalType::FixedLenByteArray(12), + repetition, + Some(PrimitiveConvertedType::Interval), + None, + None, + )?), + DataType::List(f) | DataType::FixedSizeList(f, _) | DataType::LargeList(f) => { + Ok(ParquetType::from_group( + name, + repetition, + Some(GroupConvertedType::List), + Some(GroupLogicalType::List), + vec![ParquetType::from_group( + "list".to_string(), + Repetition::Repeated, + None, + None, + vec![to_parquet_type(f)?], + None, + )], + None, + )) + }, + DataType::Map(f, _) => Ok(ParquetType::from_group( + name, + repetition, + Some(GroupConvertedType::Map), + Some(GroupLogicalType::Map), + vec![ParquetType::from_group( + "map".to_string(), + Repetition::Repeated, + None, + None, + vec![to_parquet_type(f)?], + None, + )], + None, + )), + other => Err(Error::NotYetImplemented(format!( + "Writing the data type {other:?} is not yet implemented" + ))), + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/sink.rs b/crates/nano-arrow/src/io/parquet/write/sink.rs new file mode 100644 index 000000000000..d357d7b89c2d --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/sink.rs @@ -0,0 +1,236 @@ +use std::pin::Pin; +use std::task::Poll; + +use ahash::AHashMap; +use futures::future::BoxFuture; +use futures::{AsyncWrite, AsyncWriteExt, FutureExt, Sink, TryFutureExt}; +use parquet2::metadata::KeyValue; +use parquet2::write::{FileStreamer, WriteOptions as ParquetWriteOptions}; + +use super::file::add_arrow_schema; +use super::{Encoding, SchemaDescriptor, WriteOptions}; +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::Schema; +use crate::error::Error; + +/// Sink that writes array [`chunks`](Chunk) as a Parquet file. +/// +/// Any values in the sink's `metadata` field will be written to the file's footer +/// when the sink is closed. +/// +/// # Examples +/// +/// ``` +/// use futures::SinkExt; +/// use arrow2::array::{Array, Int32Array}; +/// use arrow2::datatypes::{DataType, Field, Schema}; +/// use arrow2::chunk::Chunk; +/// use arrow2::io::parquet::write::{Encoding, WriteOptions, CompressionOptions, Version}; +/// # use arrow2::io::parquet::write::FileSink; +/// # futures::executor::block_on(async move { +/// +/// let schema = Schema::from(vec![ +/// Field::new("values", DataType::Int32, true), +/// ]); +/// let encoding = vec![vec![Encoding::Plain]]; +/// let options = WriteOptions { +/// write_statistics: true, +/// compression: CompressionOptions::Uncompressed, +/// version: Version::V2, +/// data_pagesize_limit: None, +/// }; +/// +/// let mut buffer = vec![]; +/// let mut sink = FileSink::try_new( +/// &mut buffer, +/// schema, +/// encoding, +/// options, +/// )?; +/// +/// for i in 0..3 { +/// let values = Int32Array::from(&[Some(i), None]); +/// let chunk = Chunk::new(vec![values.boxed()]); +/// sink.feed(chunk).await?; +/// } +/// sink.metadata.insert(String::from("key"), Some(String::from("value"))); +/// sink.close().await?; +/// # arrow2::error::Result::Ok(()) +/// # }).unwrap(); +/// ``` +pub struct FileSink<'a, W: AsyncWrite + Send + Unpin> { + writer: Option>, + task: Option>, Error>>>, + options: WriteOptions, + encodings: Vec>, + schema: Schema, + parquet_schema: SchemaDescriptor, + /// Key-value metadata that will be written to the file on close. + pub metadata: AHashMap>, +} + +impl<'a, W> FileSink<'a, W> +where + W: AsyncWrite + Send + Unpin + 'a, +{ + /// Create a new sink that writes arrays to the provided `writer`. 
+ /// + /// # Error + /// Iff + /// * the Arrow schema can't be converted to a valid Parquet schema. + /// * the length of the encodings is different from the number of fields in schema + pub fn try_new( + writer: W, + schema: Schema, + encodings: Vec>, + options: WriteOptions, + ) -> Result { + if encodings.len() != schema.fields.len() { + return Err(Error::InvalidArgumentError( + "The number of encodings must equal the number of fields".to_string(), + )); + } + + let parquet_schema = crate::io::parquet::write::to_parquet_schema(&schema)?; + let created_by = Some("Arrow2 - Native Rust implementation of Arrow".to_string()); + let writer = FileStreamer::new( + writer, + parquet_schema.clone(), + ParquetWriteOptions { + version: options.version, + write_statistics: options.write_statistics, + }, + created_by, + ); + Ok(Self { + writer: Some(writer), + task: None, + options, + schema, + encodings, + parquet_schema, + metadata: AHashMap::default(), + }) + } + + /// The Arrow [`Schema`] for the file. + pub fn schema(&self) -> &Schema { + &self.schema + } + + /// The Parquet [`SchemaDescriptor`] for the file. + pub fn parquet_schema(&self) -> &SchemaDescriptor { + &self.parquet_schema + } + + /// The write options for the file. + pub fn options(&self) -> &WriteOptions { + &self.options + } + + fn poll_complete( + &mut self, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + if let Some(task) = &mut self.task { + match futures::ready!(task.poll_unpin(cx)) { + Ok(writer) => { + self.task = None; + self.writer = writer; + Poll::Ready(Ok(())) + }, + Err(error) => { + self.task = None; + Poll::Ready(Err(error)) + }, + } + } else { + Poll::Ready(Ok(())) + } + } +} + +impl<'a, W> Sink>> for FileSink<'a, W> +where + W: AsyncWrite + Send + Unpin + 'a, +{ + type Error = Error; + + fn start_send(self: Pin<&mut Self>, item: Chunk>) -> Result<(), Self::Error> { + if self.schema.fields.len() != item.arrays().len() { + return Err(Error::InvalidArgumentError( + "The number of arrays in the chunk must equal the number of fields in the schema" + .to_string(), + )); + } + let this = self.get_mut(); + if let Some(mut writer) = this.writer.take() { + let rows = crate::io::parquet::write::row_group_iter( + item, + this.encodings.clone(), + this.parquet_schema.fields().to_vec(), + this.options, + ); + this.task = Some(Box::pin(async move { + writer.write(rows).await?; + Ok(Some(writer)) + })); + Ok(()) + } else { + Err(Error::Io(std::io::Error::new( + std::io::ErrorKind::UnexpectedEof, + "writer closed".to_string(), + ))) + } + } + + fn poll_ready( + self: Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + self.get_mut().poll_complete(cx) + } + + fn poll_flush( + self: Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + self.get_mut().poll_complete(cx) + } + + fn poll_close( + self: Pin<&mut Self>, + cx: &mut std::task::Context<'_>, + ) -> std::task::Poll> { + let this = self.get_mut(); + match futures::ready!(this.poll_complete(cx)) { + Ok(()) => { + let writer = this.writer.take(); + if let Some(mut writer) = writer { + let meta = std::mem::take(&mut this.metadata); + let metadata = if meta.is_empty() { + None + } else { + Some( + meta.into_iter() + .map(|(k, v)| KeyValue::new(k, v)) + .collect::>(), + ) + }; + let kv_meta = add_arrow_schema(&this.schema, metadata); + + this.task = Some(Box::pin(async move { + writer.end(kv_meta).map_err(Error::from).await?; + writer.into_inner().close().map_err(Error::from).await?; + Ok(None) + })); + 
this.poll_complete(cx) + } else { + Poll::Ready(Ok(())) + } + }, + Err(error) => Poll::Ready(Err(error)), + } + } +} diff --git a/crates/nano-arrow/src/io/parquet/write/utf8/basic.rs b/crates/nano-arrow/src/io/parquet/write/utf8/basic.rs new file mode 100644 index 000000000000..39f9c157c988 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/utf8/basic.rs @@ -0,0 +1,117 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::{serialize_statistics, BinaryStatistics, ParquetStatistics, Statistics}; + +use super::super::binary::{encode_delta, ord_binary}; +use super::super::{utils, WriteOptions}; +use crate::array::{Array, Utf8Array}; +use crate::error::{Error, Result}; +use crate::io::parquet::read::schema::is_nullable; +use crate::offset::Offset; + +pub(crate) fn encode_plain( + array: &Utf8Array, + is_optional: bool, + buffer: &mut Vec, +) { + if is_optional { + array.iter().for_each(|x| { + if let Some(x) = x { + // BYTE_ARRAY: first 4 bytes denote length in littleendian. + let len = (x.len() as u32).to_le_bytes(); + buffer.extend_from_slice(&len); + buffer.extend_from_slice(x.as_bytes()); + } + }) + } else { + array.values_iter().for_each(|x| { + // BYTE_ARRAY: first 4 bytes denote length in littleendian. + let len = (x.len() as u32).to_le_bytes(); + buffer.extend_from_slice(&len); + buffer.extend_from_slice(x.as_bytes()); + }) + } +} + +pub fn array_to_page( + array: &Utf8Array, + options: WriteOptions, + type_: PrimitiveType, + encoding: Encoding, +) -> Result { + let validity = array.validity(); + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + utils::write_def_levels( + &mut buffer, + is_optional, + validity, + array.len(), + options.version, + )?; + + let definition_levels_byte_length = buffer.len(); + + match encoding { + Encoding::Plain => encode_plain(array, is_optional, &mut buffer), + Encoding::DeltaLengthByteArray => encode_delta( + array.values(), + array.offsets().buffer(), + array.validity(), + is_optional, + &mut buffer, + ), + _ => { + return Err(Error::InvalidArgumentError(format!( + "Datatype {:?} cannot be encoded by {:?} encoding", + array.data_type(), + encoding + ))) + }, + } + + let statistics = if options.write_statistics { + Some(build_statistics(array, type_.clone())) + } else { + None + }; + + utils::build_plain_page( + buffer, + array.len(), + array.len(), + array.null_count(), + 0, + definition_levels_byte_length, + statistics, + type_, + options, + encoding, + ) +} + +pub(crate) fn build_statistics( + array: &Utf8Array, + primitive_type: PrimitiveType, +) -> ParquetStatistics { + let statistics = &BinaryStatistics { + primitive_type, + null_count: Some(array.null_count() as i64), + distinct_count: None, + max_value: array + .iter() + .flatten() + .map(|x| x.as_bytes()) + .max_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + min_value: array + .iter() + .flatten() + .map(|x| x.as_bytes()) + .min_by(|x, y| ord_binary(x, y)) + .map(|x| x.to_vec()), + } as &dyn Statistics; + serialize_statistics(statistics) +} diff --git a/crates/nano-arrow/src/io/parquet/write/utf8/mod.rs b/crates/nano-arrow/src/io/parquet/write/utf8/mod.rs new file mode 100644 index 000000000000..e4ef46599e2c --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/utf8/mod.rs @@ -0,0 +1,6 @@ +mod basic; +mod nested; + +pub use basic::array_to_page; +pub(crate) use basic::{build_statistics, encode_plain}; +pub use nested::array_to_page as nested_array_to_page; 
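Aside (not part of the diff): `encode_plain` above implements Parquet's PLAIN encoding for BYTE_ARRAY/UTF-8 columns: each non-null value is written as a 4-byte little-endian length prefix followed by the raw bytes, while null slots are skipped because their positions are already captured by the definition levels. A minimal sketch of that layout, using a hypothetical `plain_encode_strings` helper:

```rust
// Sketch only: PLAIN encoding of UTF-8 values, mirroring `encode_plain` above.
// Each value is a 4-byte little-endian length prefix followed by its bytes;
// nulls are skipped (they are recorded via definition levels, not in the data).
fn plain_encode_strings(values: &[Option<&str>], buffer: &mut Vec<u8>) {
    for value in values.iter().flatten() {
        buffer.extend_from_slice(&(value.len() as u32).to_le_bytes());
        buffer.extend_from_slice(value.as_bytes());
    }
}

// plain_encode_strings(&[Some("ab"), None, Some("c")], &mut buf) produces
// [2, 0, 0, 0, b'a', b'b', 1, 0, 0, 0, b'c'].
```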
diff --git a/crates/nano-arrow/src/io/parquet/write/utf8/nested.rs b/crates/nano-arrow/src/io/parquet/write/utf8/nested.rs new file mode 100644 index 000000000000..43767246d194 --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/utf8/nested.rs @@ -0,0 +1,48 @@ +use parquet2::encoding::Encoding; +use parquet2::page::DataPage; +use parquet2::schema::types::PrimitiveType; + +use super::super::{nested, utils, WriteOptions}; +use super::basic::{build_statistics, encode_plain}; +use crate::array::{Array, Utf8Array}; +use crate::error::Result; +use crate::io::parquet::read::schema::is_nullable; +use crate::io::parquet::write::Nested; +use crate::offset::Offset; + +pub fn array_to_page( + array: &Utf8Array, + options: WriteOptions, + type_: PrimitiveType, + nested: &[Nested], +) -> Result +where + O: Offset, +{ + let is_optional = is_nullable(&type_.field_info); + + let mut buffer = vec![]; + let (repetition_levels_byte_length, definition_levels_byte_length) = + nested::write_rep_and_def(options.version, nested, &mut buffer)?; + + encode_plain(array, is_optional, &mut buffer); + + let statistics = if options.write_statistics { + Some(build_statistics(array, type_.clone())) + } else { + None + }; + + utils::build_plain_page( + buffer, + nested::num_values(nested), + nested[0].len(), + array.null_count(), + repetition_levels_byte_length, + definition_levels_byte_length, + statistics, + type_, + options, + Encoding::Plain, + ) +} diff --git a/crates/nano-arrow/src/io/parquet/write/utils.rs b/crates/nano-arrow/src/io/parquet/write/utils.rs new file mode 100644 index 000000000000..caaba98a07fe --- /dev/null +++ b/crates/nano-arrow/src/io/parquet/write/utils.rs @@ -0,0 +1,146 @@ +use parquet2::compression::CompressionOptions; +use parquet2::encoding::hybrid_rle::encode_bool; +use parquet2::encoding::Encoding; +use parquet2::metadata::Descriptor; +use parquet2::page::{DataPage, DataPageHeader, DataPageHeaderV1, DataPageHeaderV2}; +use parquet2::schema::types::PrimitiveType; +use parquet2::statistics::ParquetStatistics; + +use super::{Version, WriteOptions}; +use crate::bitmap::Bitmap; +use crate::error::Result; + +fn encode_iter_v1>(buffer: &mut Vec, iter: I) -> Result<()> { + buffer.extend_from_slice(&[0; 4]); + let start = buffer.len(); + encode_bool(buffer, iter)?; + let end = buffer.len(); + let length = end - start; + + // write the first 4 bytes as length + let length = (length as i32).to_le_bytes(); + (0..4).for_each(|i| buffer[start - 4 + i] = length[i]); + Ok(()) +} + +fn encode_iter_v2>(writer: &mut Vec, iter: I) -> Result<()> { + Ok(encode_bool(writer, iter)?) +} + +fn encode_iter>( + writer: &mut Vec, + iter: I, + version: Version, +) -> Result<()> { + match version { + Version::V1 => encode_iter_v1(writer, iter), + Version::V2 => encode_iter_v2(writer, iter), + } +} + +/// writes the def levels to a `Vec` and returns it. 
+pub fn write_def_levels( + writer: &mut Vec, + is_optional: bool, + validity: Option<&Bitmap>, + len: usize, + version: Version, +) -> Result<()> { + // encode def levels + match (is_optional, validity) { + (true, Some(validity)) => encode_iter(writer, validity.iter(), version), + (true, None) => encode_iter(writer, std::iter::repeat(true).take(len), version), + _ => Ok(()), // is required => no def levels + } +} + +#[allow(clippy::too_many_arguments)] +pub fn build_plain_page( + buffer: Vec, + num_values: usize, + num_rows: usize, + null_count: usize, + repetition_levels_byte_length: usize, + definition_levels_byte_length: usize, + statistics: Option, + type_: PrimitiveType, + options: WriteOptions, + encoding: Encoding, +) -> Result { + let header = match options.version { + Version::V1 => DataPageHeader::V1(DataPageHeaderV1 { + num_values: num_values as i32, + encoding: encoding.into(), + definition_level_encoding: Encoding::Rle.into(), + repetition_level_encoding: Encoding::Rle.into(), + statistics, + }), + Version::V2 => DataPageHeader::V2(DataPageHeaderV2 { + num_values: num_values as i32, + encoding: encoding.into(), + num_nulls: null_count as i32, + num_rows: num_rows as i32, + definition_levels_byte_length: definition_levels_byte_length as i32, + repetition_levels_byte_length: repetition_levels_byte_length as i32, + is_compressed: Some(options.compression != CompressionOptions::Uncompressed), + statistics, + }), + }; + Ok(DataPage::new( + header, + buffer, + Descriptor { + primitive_type: type_, + max_def_level: 0, + max_rep_level: 0, + }, + Some(num_rows), + )) +} + +/// Auxiliary iterator adapter to declare the size hint of an iterator. +pub(super) struct ExactSizedIter> { + iter: I, + remaining: usize, +} + +impl + Clone> Clone for ExactSizedIter { + fn clone(&self) -> Self { + Self { + iter: self.iter.clone(), + remaining: self.remaining, + } + } +} + +impl> ExactSizedIter { + pub fn new(iter: I, length: usize) -> Self { + Self { + iter, + remaining: length, + } + } +} + +impl> Iterator for ExactSizedIter { + type Item = T; + + #[inline] + fn next(&mut self) -> Option { + self.iter.next().map(|x| { + self.remaining -= 1; + x + }) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.remaining, Some(self.remaining)) + } +} + +/// Returns the number of bits needed to bitpack `max` +#[inline] +pub fn get_bit_width(max: u64) -> u32 { + 64 - max.leading_zeros() +} diff --git a/crates/nano-arrow/src/lib.rs b/crates/nano-arrow/src/lib.rs new file mode 100644 index 000000000000..c26b3e1a0b28 --- /dev/null +++ b/crates/nano-arrow/src/lib.rs @@ -0,0 +1,42 @@ +// So that we have more control over what is `unsafe` inside an `unsafe` block +#![allow(unused_unsafe)] +// +#![allow(clippy::len_without_is_empty)] +// this landed on 1.60. Let's not force everyone to bump just yet +#![allow(clippy::unnecessary_lazy_evaluations)] +// Trait objects must be returned as a &Box so that they can be cloned +#![allow(clippy::borrowed_box)] +// Allow type complexity warning to avoid API break. 
+#![allow(clippy::type_complexity)] +#![cfg_attr(docsrs, feature(doc_cfg))] +#![cfg_attr(feature = "simd", feature(portable_simd))] +#![cfg_attr(feature = "nightly_build", feature(build_hasher_simple_hash_one))] + +#[macro_use] +pub mod array; +pub mod bitmap; +pub mod buffer; +pub mod chunk; +pub mod error; +#[cfg(feature = "io_ipc")] +#[cfg_attr(docsrs, doc(cfg(feature = "io_ipc")))] +pub mod mmap; + +pub mod offset; +pub mod scalar; +pub mod trusted_len; +pub mod types; + +pub mod compute; +pub mod io; +pub mod temporal_conversions; + +pub mod datatypes; + +pub mod ffi; +pub mod util; + +// re-exported because we return `Either` in our public API +// re-exported to construct dictionaries +pub use ahash::AHashMap; +pub use either::Either; diff --git a/crates/nano-arrow/src/mmap/array.rs b/crates/nano-arrow/src/mmap/array.rs new file mode 100644 index 000000000000..8efd6afcd671 --- /dev/null +++ b/crates/nano-arrow/src/mmap/array.rs @@ -0,0 +1,568 @@ +use std::collections::VecDeque; +use std::sync::Arc; + +use crate::array::{Array, DictionaryKey, FixedSizeListArray, ListArray, StructArray}; +use crate::datatypes::DataType; +use crate::error::Error; +use crate::ffi::mmap::create_array; +use crate::ffi::{export_array_to_c, try_from, ArrowArray, InternalArrowArray}; +use crate::io::ipc::read::{Dictionaries, IpcBuffer, Node, OutOfSpecKind}; +use crate::io::ipc::IpcField; +use crate::offset::Offset; +use crate::types::NativeType; + +fn get_buffer_bounds(buffers: &mut VecDeque) -> Result<(usize, usize), Error> { + let buffer = buffers + .pop_front() + .ok_or_else(|| Error::from(OutOfSpecKind::ExpectedBuffer))?; + + let offset: usize = buffer + .offset() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let length: usize = buffer + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + Ok((offset, length)) +} + +fn get_buffer<'a, T: NativeType>( + data: &'a [u8], + block_offset: usize, + buffers: &mut VecDeque, + num_rows: usize, +) -> Result<&'a [u8], Error> { + let (offset, length) = get_buffer_bounds(buffers)?; + + // verify that they are in-bounds + let values = data + .get(block_offset + offset..block_offset + offset + length) + .ok_or_else(|| Error::OutOfSpec("buffer out of bounds".to_string()))?; + + // validate alignment + let v: &[T] = bytemuck::try_cast_slice(values) + .map_err(|_| Error::OutOfSpec("buffer not aligned for mmap".to_string()))?; + + if v.len() < num_rows { + return Err(Error::OutOfSpec( + "buffer's length is too small in mmap".to_string(), + )); + } + + Ok(values) +} + +fn get_validity<'a>( + data: &'a [u8], + block_offset: usize, + buffers: &mut VecDeque, + null_count: usize, +) -> Result, Error> { + let validity = get_buffer_bounds(buffers)?; + let (offset, length) = validity; + + Ok(if null_count > 0 { + // verify that they are in-bounds and get its pointer + Some( + data.get(block_offset + offset..block_offset + offset + length) + .ok_or_else(|| Error::OutOfSpec("buffer out of bounds".to_string()))?, + ) + } else { + None + }) +} + +fn mmap_binary>( + data: Arc, + node: &Node, + block_offset: usize, + buffers: &mut VecDeque, +) -> Result { + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, 
null_count)?.map(|x| x.as_ptr()); + + let offsets = get_buffer::(data_ref, block_offset, buffers, num_rows + 1)?.as_ptr(); + let values = get_buffer::(data_ref, block_offset, buffers, 0)?.as_ptr(); + + // NOTE: offsets and values invariants are _not_ validated + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(offsets), Some(values)].into_iter(), + [].into_iter(), + None, + None, + ) + }) +} + +fn mmap_fixed_size_binary>( + data: Arc, + node: &Node, + block_offset: usize, + buffers: &mut VecDeque, + data_type: &DataType, +) -> Result { + let bytes_per_row = if let DataType::FixedSizeBinary(bytes_per_row) = data_type { + bytes_per_row + } else { + return Err(Error::from(OutOfSpecKind::InvalidDataType)); + }; + + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + let values = + get_buffer::(data_ref, block_offset, buffers, num_rows * bytes_per_row)?.as_ptr(); + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(values)].into_iter(), + [].into_iter(), + None, + None, + ) + }) +} + +fn mmap_null>( + data: Arc, + node: &Node, + _block_offset: usize, + _buffers: &mut VecDeque, +) -> Result { + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [].into_iter(), + [].into_iter(), + None, + None, + ) + }) +} + +fn mmap_boolean>( + data: Arc, + node: &Node, + block_offset: usize, + buffers: &mut VecDeque, +) -> Result { + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let values = get_buffer_bounds(buffers)?; + let (offset, length) = values; + + // verify that they are in-bounds and get its pointer + let values = data_ref[block_offset + offset..block_offset + offset + length].as_ptr(); + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(values)].into_iter(), + [].into_iter(), + None, + None, + ) + }) +} + +fn mmap_primitive>( + data: Arc, + node: &Node, + block_offset: usize, + buffers: &mut VecDeque, +) -> Result { + let data_ref = data.as_ref().as_ref(); + + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let values = get_buffer::
<P>
(data_ref, block_offset, buffers, num_rows)?.as_ptr(); + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(values)].into_iter(), + [].into_iter(), + None, + None, + ) + }) +} + +#[allow(clippy::too_many_arguments)] +fn mmap_list>( + data: Arc, + node: &Node, + block_offset: usize, + data_type: &DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result { + let child = ListArray::::try_get_child(data_type)?.data_type(); + + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let offsets = get_buffer::(data_ref, block_offset, buffers, num_rows + 1)?.as_ptr(); + + let values = get_array( + data.clone(), + block_offset, + child, + &ipc_field.fields[0], + dictionaries, + field_nodes, + buffers, + )?; + + // NOTE: offsets and values invariants are _not_ validated + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(offsets)].into_iter(), + [values].into_iter(), + None, + None, + ) + }) +} + +#[allow(clippy::too_many_arguments)] +fn mmap_fixed_size_list>( + data: Arc, + node: &Node, + block_offset: usize, + data_type: &DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result { + let child = FixedSizeListArray::try_child_and_size(data_type)? + .0 + .data_type(); + + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let values = get_array( + data.clone(), + block_offset, + child, + &ipc_field.fields[0], + dictionaries, + field_nodes, + buffers, + )?; + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity].into_iter(), + [values].into_iter(), + None, + None, + ) + }) +} + +#[allow(clippy::too_many_arguments)] +fn mmap_struct>( + data: Arc, + node: &Node, + block_offset: usize, + data_type: &DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result { + let children = StructArray::try_get_fields(data_type)?; + + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let values = children + .iter() + .map(|f| &f.data_type) + .zip(ipc_field.fields.iter()) + .map(|(child, ipc)| { + get_array( + data.clone(), + block_offset, + child, + ipc, + dictionaries, + field_nodes, + buffers, + ) + }) + .collect::, Error>>()?; + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity].into_iter(), + values.into_iter(), + None, + None, + ) + }) +} + 
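Aside (not part of the diff): the `get_buffer` helper above only hands out a memory-mapped region after `bytemuck::try_cast_slice` confirms the bytes are correctly aligned for the target native type, and after checking that the region is long enough for the declared row count. A standalone sketch of that validation, using a hypothetical `cast_checked` helper:

```rust
// Sketch only: reinterpret raw mmapped bytes as a typed slice, rejecting regions
// that are mis-aligned for `T` or whose length is not a whole number of `T`s,
// and regions too short for the number of rows promised by the IPC node.
fn cast_checked<T: bytemuck::Pod>(bytes: &[u8], num_rows: usize) -> Option<&[T]> {
    let typed: &[T] = bytemuck::try_cast_slice(bytes).ok()?;
    (typed.len() >= num_rows).then_some(typed)
}
```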
+#[allow(clippy::too_many_arguments)] +fn mmap_dict>( + data: Arc, + node: &Node, + block_offset: usize, + _: &DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + _: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result { + let num_rows: usize = node + .length() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let null_count: usize = node + .null_count() + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let data_ref = data.as_ref().as_ref(); + + let dictionary = dictionaries + .get(&ipc_field.dictionary_id.unwrap()) + .ok_or_else(|| Error::oos("Missing dictionary"))? + .clone(); + + let validity = get_validity(data_ref, block_offset, buffers, null_count)?.map(|x| x.as_ptr()); + + let values = get_buffer::(data_ref, block_offset, buffers, num_rows)?.as_ptr(); + + Ok(unsafe { + create_array( + data, + num_rows, + null_count, + [validity, Some(values)].into_iter(), + [].into_iter(), + Some(export_array_to_c(dictionary)), + None, + ) + }) +} + +fn get_array>( + data: Arc, + block_offset: usize, + data_type: &DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result { + use crate::datatypes::PhysicalType::*; + let node = field_nodes + .pop_front() + .ok_or_else(|| Error::from(OutOfSpecKind::ExpectedBuffer))?; + + match data_type.to_physical_type() { + Null => mmap_null(data, &node, block_offset, buffers), + Boolean => mmap_boolean(data, &node, block_offset, buffers), + Primitive(p) => with_match_primitive_type!(p, |$T| { + mmap_primitive::<$T, _>(data, &node, block_offset, buffers) + }), + Utf8 | Binary => mmap_binary::(data, &node, block_offset, buffers), + FixedSizeBinary => mmap_fixed_size_binary(data, &node, block_offset, buffers, data_type), + LargeBinary | LargeUtf8 => mmap_binary::(data, &node, block_offset, buffers), + List => mmap_list::( + data, + &node, + block_offset, + data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + ), + LargeList => mmap_list::( + data, + &node, + block_offset, + data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + ), + FixedSizeList => mmap_fixed_size_list( + data, + &node, + block_offset, + data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + ), + Struct => mmap_struct( + data, + &node, + block_offset, + data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + ), + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + mmap_dict::<$T, _>( + data, + &node, + block_offset, + data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + ) + }), + _ => todo!(), + } +} + +/// Maps a memory region to an [`Array`]. +pub(crate) unsafe fn mmap>( + data: Arc, + block_offset: usize, + data_type: DataType, + ipc_field: &IpcField, + dictionaries: &Dictionaries, + field_nodes: &mut VecDeque, + buffers: &mut VecDeque, +) -> Result, Error> { + let array = get_array( + data, + block_offset, + &data_type, + ipc_field, + dictionaries, + field_nodes, + buffers, + )?; + // The unsafety comes from the fact that `array` is not necessarily valid - + // the IPC file may be corrupted (e.g. invalid offsets or non-utf8 data) + unsafe { try_from(InternalArrowArray::new(array, data_type)) } +} diff --git a/crates/nano-arrow/src/mmap/mod.rs b/crates/nano-arrow/src/mmap/mod.rs new file mode 100644 index 000000000000..58265892ea57 --- /dev/null +++ b/crates/nano-arrow/src/mmap/mod.rs @@ -0,0 +1,227 @@ +//! 
Memory maps regions defined on the IPC format into [`Array`]. +use std::collections::VecDeque; +use std::sync::Arc; + +mod array; + +use arrow_format::ipc::planus::ReadAsRoot; +use arrow_format::ipc::{Block, MessageRef, RecordBatchRef}; + +use crate::array::Array; +use crate::chunk::Chunk; +use crate::datatypes::{DataType, Field}; +use crate::error::Error; +use crate::io::ipc::read::file::{get_dictionary_batch, get_record_batch}; +use crate::io::ipc::read::{ + first_dict_field, Dictionaries, FileMetadata, IpcBuffer, Node, OutOfSpecKind, +}; +use crate::io::ipc::{IpcField, CONTINUATION_MARKER}; + +fn read_message( + mut bytes: &[u8], + block: arrow_format::ipc::Block, +) -> Result<(MessageRef, usize), Error> { + let offset: usize = block + .offset + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let block_length: usize = block + .meta_data_length + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + bytes = &bytes[offset..]; + let mut message_length = bytes[..4].try_into().unwrap(); + bytes = &bytes[4..]; + + if message_length == CONTINUATION_MARKER { + // continuation marker encountered, read message next + message_length = bytes[..4].try_into().unwrap(); + bytes = &bytes[4..]; + }; + + let message_length: usize = i32::from_le_bytes(message_length) + .try_into() + .map_err(|_| Error::from(OutOfSpecKind::NegativeFooterLength))?; + + let message = arrow_format::ipc::MessageRef::read_as_root(&bytes[..message_length]) + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferMessage(err)))?; + + Ok((message, offset + block_length)) +} + +fn get_buffers_nodes( + batch: RecordBatchRef, +) -> Result<(VecDeque, VecDeque), Error> { + let compression = batch.compression()?; + if compression.is_some() { + return Err(Error::nyi( + "mmap can only be done on uncompressed IPC files", + )); + } + + let buffers = batch + .buffers() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferBuffers(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageBuffers))?; + let buffers = buffers.iter().collect::>(); + + let field_nodes = batch + .nodes() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferNodes(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingMessageNodes))?; + let field_nodes = field_nodes.iter().collect::>(); + + Ok((buffers, field_nodes)) +} + +unsafe fn _mmap_record>( + fields: &[Field], + ipc_fields: &[IpcField], + data: Arc, + batch: RecordBatchRef, + offset: usize, + dictionaries: &Dictionaries, +) -> Result>, Error> { + let (mut buffers, mut field_nodes) = get_buffers_nodes(batch)?; + + fields + .iter() + .map(|f| &f.data_type) + .cloned() + .zip(ipc_fields) + .map(|(data_type, ipc_field)| { + array::mmap( + data.clone(), + offset, + data_type, + ipc_field, + dictionaries, + &mut field_nodes, + &mut buffers, + ) + }) + .collect::>() + .and_then(Chunk::try_new) +} + +unsafe fn _mmap_unchecked>( + fields: &[Field], + ipc_fields: &[IpcField], + data: Arc, + block: Block, + dictionaries: &Dictionaries, +) -> Result>, Error> { + let (message, offset) = read_message(data.as_ref().as_ref(), block)?; + let batch = get_record_batch(message)?; + _mmap_record( + fields, + ipc_fields, + data.clone(), + batch, + offset, + dictionaries, + ) +} + +/// Memory maps an record batch from an IPC file into a [`Chunk`]. +/// # Errors +/// This function errors when: +/// * The IPC file is not valid +/// * the buffers on the file are un-aligned with their corresponding data. 
This can happen when: +/// * the file was written with 8-bit alignment +/// * the file contains type decimal 128 or 256 +/// # Safety +/// The caller must ensure that `data` contains a valid buffers, for example: +/// * Offsets in variable-sized containers must be in-bounds and increasing +/// * Utf8 data is valid +pub unsafe fn mmap_unchecked>( + metadata: &FileMetadata, + dictionaries: &Dictionaries, + data: Arc, + chunk: usize, +) -> Result>, Error> { + let block = metadata.blocks[chunk]; + + let (message, offset) = read_message(data.as_ref().as_ref(), block)?; + let batch = get_record_batch(message)?; + _mmap_record( + &metadata.schema.fields, + &metadata.ipc_schema.fields, + data.clone(), + batch, + offset, + dictionaries, + ) +} + +unsafe fn mmap_dictionary>( + metadata: &FileMetadata, + data: Arc, + block: Block, + dictionaries: &mut Dictionaries, +) -> Result<(), Error> { + let (message, offset) = read_message(data.as_ref().as_ref(), block)?; + let batch = get_dictionary_batch(&message)?; + + let id = batch + .id() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferId(err)))?; + let (first_field, first_ipc_field) = + first_dict_field(id, &metadata.schema.fields, &metadata.ipc_schema.fields)?; + + let batch = batch + .data() + .map_err(|err| Error::from(OutOfSpecKind::InvalidFlatbufferData(err)))? + .ok_or_else(|| Error::from(OutOfSpecKind::MissingData))?; + + let value_type = + if let DataType::Dictionary(_, value_type, _) = first_field.data_type.to_logical_type() { + value_type.as_ref() + } else { + return Err(Error::from(OutOfSpecKind::InvalidIdDataType { + requested_id: id, + })); + }; + + // Make a fake schema for the dictionary batch. + let field = Field::new("", value_type.clone(), false); + + let chunk = _mmap_record( + &[field], + &[first_ipc_field.clone()], + data.clone(), + batch, + offset, + dictionaries, + )?; + + dictionaries.insert(id, chunk.into_arrays().pop().unwrap()); + + Ok(()) +} + +/// Memory maps dictionaries from an IPC file into +/// # Safety +/// The caller must ensure that `data` contains a valid buffers, for example: +/// * Offsets in variable-sized containers must be in-bounds and increasing +/// * Utf8 data is valid +pub unsafe fn mmap_dictionaries_unchecked>( + metadata: &FileMetadata, + data: Arc, +) -> Result { + let blocks = if let Some(blocks) = &metadata.dictionaries { + blocks + } else { + return Ok(Default::default()); + }; + + let mut dictionaries = Default::default(); + + blocks + .iter() + .cloned() + .try_for_each(|block| mmap_dictionary(metadata, data.clone(), block, &mut dictionaries))?; + Ok(dictionaries) +} diff --git a/crates/nano-arrow/src/offset.rs b/crates/nano-arrow/src/offset.rs new file mode 100644 index 000000000000..409e695ba66a --- /dev/null +++ b/crates/nano-arrow/src/offset.rs @@ -0,0 +1,543 @@ +//! Contains the declaration of [`Offset`] +use std::hint::unreachable_unchecked; + +use crate::buffer::Buffer; +use crate::error::Error; +pub use crate::types::Offset; + +/// A wrapper type of [`Vec`] representing the invariants of Arrow's offsets. +/// It is guaranteed to (sound to assume that): +/// * every element is `>= 0` +/// * element at position `i` is >= than element at position `i-1`. 
+#[derive(Debug, Clone, PartialEq, Eq)] +pub struct Offsets(Vec); + +impl Default for Offsets { + #[inline] + fn default() -> Self { + Self::new() + } +} + +impl TryFrom> for Offsets { + type Error = Error; + + #[inline] + fn try_from(offsets: Vec) -> Result { + try_check_offsets(&offsets)?; + Ok(Self(offsets)) + } +} + +impl TryFrom> for OffsetsBuffer { + type Error = Error; + + #[inline] + fn try_from(offsets: Buffer) -> Result { + try_check_offsets(&offsets)?; + Ok(Self(offsets)) + } +} + +impl TryFrom> for OffsetsBuffer { + type Error = Error; + + #[inline] + fn try_from(offsets: Vec) -> Result { + try_check_offsets(&offsets)?; + Ok(Self(offsets.into())) + } +} + +impl From> for OffsetsBuffer { + #[inline] + fn from(offsets: Offsets) -> Self { + Self(offsets.0.into()) + } +} + +impl Offsets { + /// Returns an empty [`Offsets`] (i.e. with a single element, the zero) + #[inline] + pub fn new() -> Self { + Self(vec![O::zero()]) + } + + /// Returns an [`Offsets`] whose all lengths are zero. + #[inline] + pub fn new_zeroed(length: usize) -> Self { + Self(vec![O::zero(); length + 1]) + } + + /// Creates a new [`Offsets`] from an iterator of lengths + #[inline] + pub fn try_from_iter>(iter: I) -> Result { + let iterator = iter.into_iter(); + let (lower, _) = iterator.size_hint(); + let mut offsets = Self::with_capacity(lower); + for item in iterator { + offsets.try_push_usize(item)? + } + Ok(offsets) + } + + /// Returns a new [`Offsets`] with a capacity, allocating at least `capacity + 1` entries. + pub fn with_capacity(capacity: usize) -> Self { + let mut offsets = Vec::with_capacity(capacity + 1); + offsets.push(O::zero()); + Self(offsets) + } + + /// Returns the capacity of [`Offsets`]. + pub fn capacity(&self) -> usize { + self.0.capacity() - 1 + } + + /// Reserves `additional` entries. + pub fn reserve(&mut self, additional: usize) { + self.0.reserve(additional); + } + + /// Shrinks the capacity of self to fit. + pub fn shrink_to_fit(&mut self) { + self.0.shrink_to_fit(); + } + + /// Pushes a new element with a given length. + /// # Error + /// This function errors iff the new last item is larger than what `O` supports. + /// # Panic + /// This function asserts that `length > 0`. + #[inline] + pub fn try_push(&mut self, length: O) -> Result<(), Error> { + let old_length = self.last(); + assert!(length >= O::zero()); + let new_length = old_length.checked_add(&length).ok_or(Error::Overflow)?; + self.0.push(new_length); + Ok(()) + } + + /// Pushes a new element with a given length. + /// # Error + /// This function errors iff the new last item is larger than what `O` supports. + /// # Implementation + /// This function: + /// * checks that this length does not overflow + #[inline] + pub fn try_push_usize(&mut self, length: usize) -> Result<(), Error> { + let length = O::from_usize(length).ok_or(Error::Overflow)?; + + let old_length = self.last(); + let new_length = old_length.checked_add(&length).ok_or(Error::Overflow)?; + self.0.push(new_length); + Ok(()) + } + + /// Returns [`Offsets`] assuming that `offsets` fulfills its invariants + /// # Safety + /// This is safe iff the invariants of this struct are guaranteed in `offsets`. + #[inline] + pub unsafe fn new_unchecked(offsets: Vec) -> Self { + Self(offsets) + } + + /// Returns the last offset of this container. 
+ #[inline] + pub fn last(&self) -> &O { + match self.0.last() { + Some(element) => element, + None => unsafe { unreachable_unchecked() }, + } + } + + /// Returns a range (start, end) corresponding to the position `index` + /// # Panic + /// This function panics iff `index >= self.len()` + #[inline] + pub fn start_end(&self, index: usize) -> (usize, usize) { + // soundness: the invariant of the function + assert!(index < self.len_proxy()); + unsafe { self.start_end_unchecked(index) } + } + + /// Returns a range (start, end) corresponding to the position `index` + /// # Safety + /// `index` must be `< self.len()` + #[inline] + pub unsafe fn start_end_unchecked(&self, index: usize) -> (usize, usize) { + // soundness: the invariant of the function + let start = self.0.get_unchecked(index).to_usize(); + let end = self.0.get_unchecked(index + 1).to_usize(); + (start, end) + } + + /// Returns the length an array with these offsets would be. + #[inline] + pub fn len_proxy(&self) -> usize { + self.0.len() - 1 + } + + #[inline] + /// Returns the number of offsets in this container. + pub fn len(&self) -> usize { + self.0.len() + } + + /// Returns the byte slice stored in this buffer + #[inline] + pub fn as_slice(&self) -> &[O] { + self.0.as_slice() + } + + /// Pops the last element + #[inline] + pub fn pop(&mut self) -> Option { + if self.len_proxy() == 0 { + None + } else { + self.0.pop() + } + } + + /// Extends itself with `additional` elements equal to the last offset. + /// This is useful to extend offsets with empty values, e.g. for null slots. + #[inline] + pub fn extend_constant(&mut self, additional: usize) { + let offset = *self.last(); + if additional == 1 { + self.0.push(offset) + } else { + self.0.resize(self.len() + additional, offset) + } + } + + /// Try to create a new [`Offsets`] from a sequence of `lengths` + /// # Errors + /// This function errors iff this operation overflows for the maximum value of `O`. + #[inline] + pub fn try_from_lengths>(lengths: I) -> Result { + let mut self_ = Self::with_capacity(lengths.size_hint().0); + self_.try_extend_from_lengths(lengths)?; + Ok(self_) + } + + /// Try extend from an iterator of lengths + /// # Errors + /// This function errors iff this operation overflows for the maximum value of `O`. + #[inline] + pub fn try_extend_from_lengths>( + &mut self, + lengths: I, + ) -> Result<(), Error> { + let mut total_length = 0; + let mut offset = *self.last(); + let original_offset = offset.to_usize(); + + let lengths = lengths.map(|length| { + total_length += length; + O::from_as_usize(length) + }); + + let offsets = lengths.map(|length| { + offset += length; // this may overflow, checked below + offset + }); + self.0.extend(offsets); + + let last_offset = original_offset + .checked_add(total_length) + .ok_or(Error::Overflow)?; + O::from_usize(last_offset).ok_or(Error::Overflow)?; + Ok(()) + } + + /// Extends itself from another [`Offsets`] + /// # Errors + /// This function errors iff this operation overflows for the maximum value of `O`. 
+ pub fn try_extend_from_self(&mut self, other: &Self) -> Result<(), Error> { + let mut length = *self.last(); + let other_length = *other.last(); + // check if the operation would overflow + length.checked_add(&other_length).ok_or(Error::Overflow)?; + + let lengths = other.as_slice().windows(2).map(|w| w[1] - w[0]); + let offsets = lengths.map(|new_length| { + length += new_length; + length + }); + self.0.extend(offsets); + Ok(()) + } + + /// Extends itself from another [`Offsets`] sliced by `start, length` + /// # Errors + /// This function errors iff this operation overflows for the maximum value of `O`. + pub fn try_extend_from_slice( + &mut self, + other: &OffsetsBuffer, + start: usize, + length: usize, + ) -> Result<(), Error> { + if length == 0 { + return Ok(()); + } + let other = &other.0[start..start + length + 1]; + let other_length = other.last().expect("Length to be non-zero"); + let mut length = *self.last(); + // check if the operation would overflow + length.checked_add(other_length).ok_or(Error::Overflow)?; + + let lengths = other.windows(2).map(|w| w[1] - w[0]); + let offsets = lengths.map(|new_length| { + length += new_length; + length + }); + self.0.extend(offsets); + Ok(()) + } + + /// Returns the inner [`Vec`]. + #[inline] + pub fn into_inner(self) -> Vec { + self.0 + } +} + +/// Checks that `offsets` is monotonically increasing. +fn try_check_offsets(offsets: &[O]) -> Result<(), Error> { + // this code is carefully constructed to auto-vectorize, don't change naively! + match offsets.first() { + None => Err(Error::oos("offsets must have at least one element")), + Some(first) => { + if *first < O::zero() { + return Err(Error::oos("offsets must be larger than 0")); + } + let mut previous = *first; + let mut any_invalid = false; + + // This loop will auto-vectorize because there is not any break, + // an invalid value will be returned once the whole offsets buffer is processed. + for offset in offsets { + if previous > *offset { + any_invalid = true + } + previous = *offset; + } + + if any_invalid { + Err(Error::oos("offsets must be monotonically increasing")) + } else { + Ok(()) + } + }, + } +} + +/// A wrapper type of [`Buffer`] that is guaranteed to: +/// * Always contain an element +/// * Every element is `>= 0` +/// * element at position `i` is >= than element at position `i-1`. +#[derive(Clone, PartialEq, Debug)] +pub struct OffsetsBuffer(Buffer); + +impl Default for OffsetsBuffer { + #[inline] + fn default() -> Self { + Self(vec![O::zero()].into()) + } +} + +impl OffsetsBuffer { + /// # Safety + /// This is safe iff the invariants of this struct are guaranteed in `offsets`. + #[inline] + pub unsafe fn new_unchecked(offsets: Buffer) -> Self { + Self(offsets) + } + + /// Returns an empty [`OffsetsBuffer`] (i.e. with a single element, the zero) + #[inline] + pub fn new() -> Self { + Self(vec![O::zero()].into()) + } + + /// Copy-on-write API to convert [`OffsetsBuffer`] into [`Offsets`]. + #[inline] + pub fn into_mut(self) -> either::Either> { + self.0 + .into_mut() + // Safety: Offsets and OffsetsBuffer share invariants + .map_right(|offsets| unsafe { Offsets::new_unchecked(offsets) }) + .map_left(Self) + } + + /// Returns a reference to its internal [`Buffer`]. + #[inline] + pub fn buffer(&self) -> &Buffer { + &self.0 + } + + /// Returns the length an array with these offsets would be. + #[inline] + pub fn len_proxy(&self) -> usize { + self.0.len() - 1 + } + + /// Returns the number of offsets in this container. 
+ #[inline] + pub fn len(&self) -> usize { + self.0.len() + } + + /// Returns the byte slice stored in this buffer + #[inline] + pub fn as_slice(&self) -> &[O] { + self.0.as_slice() + } + + /// Returns the range of the offsets. + #[inline] + pub fn range(&self) -> O { + *self.last() - *self.first() + } + + /// Returns the first offset. + #[inline] + pub fn first(&self) -> &O { + match self.0.first() { + Some(element) => element, + None => unsafe { unreachable_unchecked() }, + } + } + + /// Returns the last offset. + #[inline] + pub fn last(&self) -> &O { + match self.0.last() { + Some(element) => element, + None => unsafe { unreachable_unchecked() }, + } + } + + /// Returns a range (start, end) corresponding to the position `index` + /// # Panic + /// This function panics iff `index >= self.len()` + #[inline] + pub fn start_end(&self, index: usize) -> (usize, usize) { + // soundness: the invariant of the function + assert!(index < self.len_proxy()); + unsafe { self.start_end_unchecked(index) } + } + + /// Returns a range (start, end) corresponding to the position `index` + /// # Safety + /// `index` must be `< self.len()` + #[inline] + pub unsafe fn start_end_unchecked(&self, index: usize) -> (usize, usize) { + // soundness: the invariant of the function + let start = self.0.get_unchecked(index).to_usize(); + let end = self.0.get_unchecked(index + 1).to_usize(); + (start, end) + } + + /// Slices this [`OffsetsBuffer`]. + /// # Panics + /// Panics if `offset + length` is larger than `len` + /// or `length == 0`. + #[inline] + pub fn slice(&mut self, offset: usize, length: usize) { + assert!(length > 0); + self.0.slice(offset, length); + } + + /// Slices this [`OffsetsBuffer`] starting at `offset`. + /// # Safety + /// The caller must ensure `offset + length <= self.len()` + #[inline] + pub unsafe fn slice_unchecked(&mut self, offset: usize, length: usize) { + self.0.slice_unchecked(offset, length); + } + + /// Returns an iterator with the lengths of the offsets + #[inline] + pub fn lengths(&self) -> impl Iterator + '_ { + self.0.windows(2).map(|w| (w[1] - w[0]).to_usize()) + } + + /// Returns the inner [`Buffer`]. 
+ #[inline] + pub fn into_inner(self) -> Buffer { + self.0 + } +} + +impl From<&OffsetsBuffer> for OffsetsBuffer { + fn from(offsets: &OffsetsBuffer) -> Self { + // this conversion is lossless and uphelds all invariants + Self( + offsets + .buffer() + .iter() + .map(|x| *x as i64) + .collect::>() + .into(), + ) + } +} + +impl TryFrom<&OffsetsBuffer> for OffsetsBuffer { + type Error = Error; + + fn try_from(offsets: &OffsetsBuffer) -> Result { + i32::try_from(*offsets.last()).map_err(|_| Error::Overflow)?; + + // this conversion is lossless and uphelds all invariants + Ok(Self( + offsets + .buffer() + .iter() + .map(|x| *x as i32) + .collect::>() + .into(), + )) + } +} + +impl From> for Offsets { + fn from(offsets: Offsets) -> Self { + // this conversion is lossless and uphelds all invariants + Self( + offsets + .as_slice() + .iter() + .map(|x| *x as i64) + .collect::>(), + ) + } +} + +impl TryFrom> for Offsets { + type Error = Error; + + fn try_from(offsets: Offsets) -> Result { + i32::try_from(*offsets.last()).map_err(|_| Error::Overflow)?; + + // this conversion is lossless and uphelds all invariants + Ok(Self( + offsets + .as_slice() + .iter() + .map(|x| *x as i32) + .collect::>(), + )) + } +} + +impl std::ops::Deref for OffsetsBuffer { + type Target = [O]; + + #[inline] + fn deref(&self) -> &[O] { + self.0.as_slice() + } +} diff --git a/crates/nano-arrow/src/scalar/README.md b/crates/nano-arrow/src/scalar/README.md new file mode 100644 index 000000000000..b780081b6131 --- /dev/null +++ b/crates/nano-arrow/src/scalar/README.md @@ -0,0 +1,28 @@ +# Scalar API + +Design choices: + +### `Scalar` is trait object + +There are three reasons: + +- a scalar should have a small memory footprint, which an enum would not ensure given the different physical types available. +- forward-compatibility: a new entry on an `enum` is backward-incompatible +- do not expose implementation details to users (reduce the surface of the public API) + +### `Scalar` MUST contain nullability information + +This is to be aligned with the general notion of arrow's `Array`. + +This API is a companion to the `Array`, and follows the same design as `Array`. +Specifically, a `Scalar` is a trait object that can be downcasted to concrete implementations. + +Like `Array`, `Scalar` implements + +- `data_type`, which is used to perform the correct downcast +- `is_valid`, to tell whether the scalar is null or not + +### There is one implementation per arrows' physical type + +- Reduces the number of `match` that users need to write +- Allows casting of logical types without changing the underlying physical type diff --git a/crates/nano-arrow/src/scalar/binary.rs b/crates/nano-arrow/src/scalar/binary.rs new file mode 100644 index 000000000000..0d33f6f8f7e4 --- /dev/null +++ b/crates/nano-arrow/src/scalar/binary.rs @@ -0,0 +1,55 @@ +use super::Scalar; +use crate::datatypes::DataType; +use crate::offset::Offset; + +/// The [`Scalar`] implementation of binary ([`Option>`]). +#[derive(Debug, Clone, PartialEq, Eq)] +pub struct BinaryScalar { + value: Option>, + phantom: std::marker::PhantomData, +} + +impl BinaryScalar { + /// Returns a new [`BinaryScalar`]. + #[inline] + pub fn new>>(value: Option
<P>
) -> Self { + Self { + value: value.map(|x| x.into()), + phantom: std::marker::PhantomData, + } + } + + /// Its value + #[inline] + pub fn value(&self) -> Option<&[u8]> { + self.value.as_ref().map(|x| x.as_ref()) + } +} + +impl>> From> for BinaryScalar { + #[inline] + fn from(v: Option
<P>
) -> Self { + Self::new(v) + } +} + +impl Scalar for BinaryScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.value.is_some() + } + + #[inline] + fn data_type(&self) -> &DataType { + if O::IS_LARGE { + &DataType::LargeBinary + } else { + &DataType::Binary + } + } +} diff --git a/crates/nano-arrow/src/scalar/boolean.rs b/crates/nano-arrow/src/scalar/boolean.rs new file mode 100644 index 000000000000..aa7d435859af --- /dev/null +++ b/crates/nano-arrow/src/scalar/boolean.rs @@ -0,0 +1,46 @@ +use super::Scalar; +use crate::datatypes::DataType; + +/// The [`Scalar`] implementation of a boolean. +#[derive(Debug, Clone, PartialEq, Eq)] +pub struct BooleanScalar { + value: Option, +} + +impl BooleanScalar { + /// Returns a new [`BooleanScalar`] + #[inline] + pub fn new(value: Option) -> Self { + Self { value } + } + + /// The value + #[inline] + pub fn value(&self) -> Option { + self.value + } +} + +impl Scalar for BooleanScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.value.is_some() + } + + #[inline] + fn data_type(&self) -> &DataType { + &DataType::Boolean + } +} + +impl From> for BooleanScalar { + #[inline] + fn from(v: Option) -> Self { + Self::new(v) + } +} diff --git a/crates/nano-arrow/src/scalar/dictionary.rs b/crates/nano-arrow/src/scalar/dictionary.rs new file mode 100644 index 000000000000..97e3e5916f52 --- /dev/null +++ b/crates/nano-arrow/src/scalar/dictionary.rs @@ -0,0 +1,54 @@ +use std::any::Any; + +use super::Scalar; +use crate::array::*; +use crate::datatypes::DataType; + +/// The [`DictionaryArray`] equivalent of [`Array`] for [`Scalar`]. +#[derive(Debug, Clone)] +pub struct DictionaryScalar { + value: Option>, + phantom: std::marker::PhantomData, + data_type: DataType, +} + +impl PartialEq for DictionaryScalar { + fn eq(&self, other: &Self) -> bool { + (self.data_type == other.data_type) && (self.value.as_ref() == other.value.as_ref()) + } +} + +impl DictionaryScalar { + /// returns a new [`DictionaryScalar`] + /// # Panics + /// iff + /// * the `data_type` is not `List` or `LargeList` (depending on this scalar's offset `O`) + /// * the child of the `data_type` is not equal to the `values` + #[inline] + pub fn new(data_type: DataType, value: Option>) -> Self { + Self { + value, + phantom: std::marker::PhantomData, + data_type, + } + } + + /// The values of the [`DictionaryScalar`] + pub fn value(&self) -> Option<&Box> { + self.value.as_ref() + } +} + +impl Scalar for DictionaryScalar { + fn as_any(&self) -> &dyn Any { + self + } + + fn is_valid(&self) -> bool { + self.value.is_some() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/equal.rs b/crates/nano-arrow/src/scalar/equal.rs new file mode 100644 index 000000000000..34f98d23640d --- /dev/null +++ b/crates/nano-arrow/src/scalar/equal.rs @@ -0,0 +1,57 @@ +use std::sync::Arc; + +use super::*; +use crate::datatypes::PhysicalType; + +impl PartialEq for dyn Scalar + '_ { + fn eq(&self, that: &dyn Scalar) -> bool { + equal(self, that) + } +} + +impl PartialEq for Arc { + fn eq(&self, that: &dyn Scalar) -> bool { + equal(&**self, that) + } +} + +impl PartialEq for Box { + fn eq(&self, that: &dyn Scalar) -> bool { + equal(&**self, that) + } +} + +macro_rules! 
dyn_eq { + ($ty:ty, $lhs:expr, $rhs:expr) => {{ + let lhs = $lhs.as_any().downcast_ref::<$ty>().unwrap(); + let rhs = $rhs.as_any().downcast_ref::<$ty>().unwrap(); + lhs == rhs + }}; +} + +fn equal(lhs: &dyn Scalar, rhs: &dyn Scalar) -> bool { + if lhs.data_type() != rhs.data_type() { + return false; + } + + use PhysicalType::*; + match lhs.data_type().to_physical_type() { + Null => dyn_eq!(NullScalar, lhs, rhs), + Boolean => dyn_eq!(BooleanScalar, lhs, rhs), + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + dyn_eq!(PrimitiveScalar<$T>, lhs, rhs) + }), + LargeUtf8 => dyn_eq!(Utf8Scalar, lhs, rhs), + LargeBinary => dyn_eq!(BinaryScalar, lhs, rhs), + LargeList => dyn_eq!(ListScalar, lhs, rhs), + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + dyn_eq!(DictionaryScalar<$T>, lhs, rhs) + }), + Struct => dyn_eq!(StructScalar, lhs, rhs), + FixedSizeBinary => dyn_eq!(FixedSizeBinaryScalar, lhs, rhs), + FixedSizeList => dyn_eq!(FixedSizeListScalar, lhs, rhs), + Union => dyn_eq!(UnionScalar, lhs, rhs), + Map => dyn_eq!(MapScalar, lhs, rhs), + _ => unimplemented!(), + } +} diff --git a/crates/nano-arrow/src/scalar/fixed_size_binary.rs b/crates/nano-arrow/src/scalar/fixed_size_binary.rs new file mode 100644 index 000000000000..d8fbb96bac2c --- /dev/null +++ b/crates/nano-arrow/src/scalar/fixed_size_binary.rs @@ -0,0 +1,58 @@ +use super::Scalar; +use crate::datatypes::DataType; + +#[derive(Debug, Clone, PartialEq, Eq)] +/// The [`Scalar`] implementation of fixed size binary ([`Option>`]). +pub struct FixedSizeBinaryScalar { + value: Option>, + data_type: DataType, +} + +impl FixedSizeBinaryScalar { + /// Returns a new [`FixedSizeBinaryScalar`]. + /// # Panics + /// iff + /// * the `data_type` is not `FixedSizeBinary` + /// * the size of child binary is not equal + #[inline] + pub fn new>>(data_type: DataType, value: Option
<P>
) -> Self { + assert_eq!( + data_type.to_physical_type(), + crate::datatypes::PhysicalType::FixedSizeBinary + ); + Self { + value: value.map(|x| { + let x: Vec = x.into(); + assert_eq!( + data_type.to_logical_type(), + &DataType::FixedSizeBinary(x.len()) + ); + x.into_boxed_slice() + }), + data_type, + } + } + + /// Its value + #[inline] + pub fn value(&self) -> Option<&[u8]> { + self.value.as_ref().map(|x| x.as_ref()) + } +} + +impl Scalar for FixedSizeBinaryScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.value.is_some() + } + + #[inline] + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/fixed_size_list.rs b/crates/nano-arrow/src/scalar/fixed_size_list.rs new file mode 100644 index 000000000000..b8333c02c347 --- /dev/null +++ b/crates/nano-arrow/src/scalar/fixed_size_list.rs @@ -0,0 +1,60 @@ +use std::any::Any; + +use super::Scalar; +use crate::array::*; +use crate::datatypes::DataType; + +/// The scalar equivalent of [`FixedSizeListArray`]. Like [`FixedSizeListArray`], this struct holds a dynamically-typed +/// [`Array`]. The only difference is that this has only one element. +#[derive(Debug, Clone)] +pub struct FixedSizeListScalar { + values: Option>, + data_type: DataType, +} + +impl PartialEq for FixedSizeListScalar { + fn eq(&self, other: &Self) -> bool { + (self.data_type == other.data_type) + && (self.values.is_some() == other.values.is_some()) + && ((self.values.is_none()) | (self.values.as_ref() == other.values.as_ref())) + } +} + +impl FixedSizeListScalar { + /// returns a new [`FixedSizeListScalar`] + /// # Panics + /// iff + /// * the `data_type` is not `FixedSizeList` + /// * the child of the `data_type` is not equal to the `values` + /// * the size of child array is not equal + #[inline] + pub fn new(data_type: DataType, values: Option>) -> Self { + let (field, size) = FixedSizeListArray::get_child_and_size(&data_type); + let inner_data_type = field.data_type(); + let values = values.map(|x| { + assert_eq!(inner_data_type, x.data_type()); + assert_eq!(size, x.len()); + x + }); + Self { values, data_type } + } + + /// The values of the [`FixedSizeListScalar`] + pub fn values(&self) -> Option<&Box> { + self.values.as_ref() + } +} + +impl Scalar for FixedSizeListScalar { + fn as_any(&self) -> &dyn Any { + self + } + + fn is_valid(&self) -> bool { + self.values.is_some() + } + + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/list.rs b/crates/nano-arrow/src/scalar/list.rs new file mode 100644 index 000000000000..d82bf02768bf --- /dev/null +++ b/crates/nano-arrow/src/scalar/list.rs @@ -0,0 +1,68 @@ +use std::any::Any; + +use super::Scalar; +use crate::array::*; +use crate::datatypes::DataType; +use crate::offset::Offset; + +/// The scalar equivalent of [`ListArray`]. Like [`ListArray`], this struct holds a dynamically-typed +/// [`Array`]. The only difference is that this has only one element. 
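+/// # Example
+/// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::array::{Array, Int32Array};
+/// use nano_arrow::datatypes::{DataType, Field};
+/// use nano_arrow::scalar::{ListScalar, Scalar};
+///
+/// // a `List<Int32>` logical type and a single (boxed) values array
+/// let data_type = DataType::List(Box::new(Field::new("item", DataType::Int32, true)));
+/// let values: Box<dyn Array> = Box::new(Int32Array::from_slice([1, 2, 3]));
+/// let scalar = ListScalar::<i32>::new(data_type, Some(values));
+/// assert!(scalar.is_valid());
+/// ```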
+#[derive(Debug, Clone)] +pub struct ListScalar { + values: Box, + is_valid: bool, + phantom: std::marker::PhantomData, + data_type: DataType, +} + +impl PartialEq for ListScalar { + fn eq(&self, other: &Self) -> bool { + (self.data_type == other.data_type) + && (self.is_valid == other.is_valid) + && ((!self.is_valid) | (self.values.as_ref() == other.values.as_ref())) + } +} + +impl ListScalar { + /// returns a new [`ListScalar`] + /// # Panics + /// iff + /// * the `data_type` is not `List` or `LargeList` (depending on this scalar's offset `O`) + /// * the child of the `data_type` is not equal to the `values` + #[inline] + pub fn new(data_type: DataType, values: Option>) -> Self { + let inner_data_type = ListArray::::get_child_type(&data_type); + let (is_valid, values) = match values { + Some(values) => { + assert_eq!(inner_data_type, values.data_type()); + (true, values) + }, + None => (false, new_empty_array(inner_data_type.clone())), + }; + Self { + values, + is_valid, + phantom: std::marker::PhantomData, + data_type, + } + } + + /// The values of the [`ListScalar`] + pub fn values(&self) -> &Box { + &self.values + } +} + +impl Scalar for ListScalar { + fn as_any(&self) -> &dyn Any { + self + } + + fn is_valid(&self) -> bool { + self.is_valid + } + + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/map.rs b/crates/nano-arrow/src/scalar/map.rs new file mode 100644 index 000000000000..90145fb6a30f --- /dev/null +++ b/crates/nano-arrow/src/scalar/map.rs @@ -0,0 +1,66 @@ +use std::any::Any; + +use super::Scalar; +use crate::array::*; +use crate::datatypes::DataType; + +/// The scalar equivalent of [`MapArray`]. Like [`MapArray`], this struct holds a dynamically-typed +/// [`Array`]. The only difference is that this has only one element. +#[derive(Debug, Clone)] +pub struct MapScalar { + values: Box, + is_valid: bool, + data_type: DataType, +} + +impl PartialEq for MapScalar { + fn eq(&self, other: &Self) -> bool { + (self.data_type == other.data_type) + && (self.is_valid == other.is_valid) + && ((!self.is_valid) | (self.values.as_ref() == other.values.as_ref())) + } +} + +impl MapScalar { + /// returns a new [`MapScalar`] + /// # Panics + /// iff + /// * the `data_type` is not `Map` + /// * the child of the `data_type` is not equal to the `values` + #[inline] + pub fn new(data_type: DataType, values: Option>) -> Self { + let inner_field = MapArray::try_get_field(&data_type).unwrap(); + let inner_data_type = inner_field.data_type(); + let (is_valid, values) = match values { + Some(values) => { + assert_eq!(inner_data_type, values.data_type()); + (true, values) + }, + None => (false, new_empty_array(inner_data_type.clone())), + }; + Self { + values, + is_valid, + data_type, + } + } + + /// The values of the [`MapScalar`] + pub fn values(&self) -> &Box { + &self.values + } +} + +impl Scalar for MapScalar { + fn as_any(&self) -> &dyn Any { + self + } + + fn is_valid(&self) -> bool { + self.is_valid + } + + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/mod.rs b/crates/nano-arrow/src/scalar/mod.rs new file mode 100644 index 000000000000..7b78b93a44f2 --- /dev/null +++ b/crates/nano-arrow/src/scalar/mod.rs @@ -0,0 +1,187 @@ +//! contains the [`Scalar`] trait object representing individual items of [`Array`](crate::array::Array)s, +//! as well as concrete implementations such as [`BooleanScalar`]. 
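+//! # Example
+//! An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+//! ```
+//! use nano_arrow::datatypes::DataType;
+//! use nano_arrow::scalar::{BooleanScalar, Scalar};
+//!
+//! let scalar = BooleanScalar::new(Some(true));
+//! assert!(scalar.is_valid());
+//! assert_eq!(scalar.data_type(), &DataType::Boolean);
+//! ```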
+use std::any::Any; + +use crate::array::*; +use crate::datatypes::*; + +mod dictionary; +pub use dictionary::*; +mod equal; +mod primitive; +pub use primitive::*; +mod utf8; +pub use utf8::*; +mod binary; +pub use binary::*; +mod boolean; +pub use boolean::*; +mod list; +pub use list::*; +mod map; +pub use map::*; +mod null; +pub use null::*; +mod struct_; +pub use struct_::*; +mod fixed_size_list; +pub use fixed_size_list::*; +mod fixed_size_binary; +pub use fixed_size_binary::*; +mod union; +pub use union::UnionScalar; + +/// Trait object declaring an optional value with a [`DataType`]. +/// This strait is often used in APIs that accept multiple scalar types. +pub trait Scalar: std::fmt::Debug + Send + Sync + dyn_clone::DynClone + 'static { + /// convert itself to + fn as_any(&self) -> &dyn Any; + + /// whether it is valid + fn is_valid(&self) -> bool; + + /// the logical type. + fn data_type(&self) -> &DataType; +} + +dyn_clone::clone_trait_object!(Scalar); + +macro_rules! dyn_new_utf8 { + ($array:expr, $index:expr, $type:ty) => {{ + let array = $array.as_any().downcast_ref::>().unwrap(); + let value = if array.is_valid($index) { + Some(array.value($index)) + } else { + None + }; + Box::new(Utf8Scalar::<$type>::new(value)) + }}; +} + +macro_rules! dyn_new_binary { + ($array:expr, $index:expr, $type:ty) => {{ + let array = $array + .as_any() + .downcast_ref::>() + .unwrap(); + let value = if array.is_valid($index) { + Some(array.value($index)) + } else { + None + }; + Box::new(BinaryScalar::<$type>::new(value)) + }}; +} + +macro_rules! dyn_new_list { + ($array:expr, $index:expr, $type:ty) => {{ + let array = $array.as_any().downcast_ref::>().unwrap(); + let value = if array.is_valid($index) { + Some(array.value($index).into()) + } else { + None + }; + Box::new(ListScalar::<$type>::new(array.data_type().clone(), value)) + }}; +} + +/// creates a new [`Scalar`] from an [`Array`]. 
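+/// # Example
+/// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::array::BooleanArray;
+/// use nano_arrow::scalar::new_scalar;
+///
+/// let array = BooleanArray::from_slice([true, false]);
+/// // extract slot 0 as a boxed `Scalar`
+/// let scalar = new_scalar(&array, 0);
+/// assert!(scalar.is_valid());
+/// ```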
+pub fn new_scalar(array: &dyn Array, index: usize) -> Box { + use PhysicalType::*; + match array.data_type().to_physical_type() { + Null => Box::new(NullScalar::new()), + Boolean => { + let array = array.as_any().downcast_ref::().unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index)) + } else { + None + }; + Box::new(BooleanScalar::new(value)) + }, + Primitive(primitive) => with_match_primitive_type!(primitive, |$T| { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index)) + } else { + None + }; + Box::new(PrimitiveScalar::new(array.data_type().clone(), value)) + }), + Utf8 => dyn_new_utf8!(array, index, i32), + LargeUtf8 => dyn_new_utf8!(array, index, i64), + Binary => dyn_new_binary!(array, index, i32), + LargeBinary => dyn_new_binary!(array, index, i64), + List => dyn_new_list!(array, index, i32), + LargeList => dyn_new_list!(array, index, i64), + Struct => { + let array = array.as_any().downcast_ref::().unwrap(); + if array.is_valid(index) { + let values = array + .values() + .iter() + .map(|x| new_scalar(x.as_ref(), index)) + .collect(); + Box::new(StructScalar::new(array.data_type().clone(), Some(values))) + } else { + Box::new(StructScalar::new(array.data_type().clone(), None)) + } + }, + FixedSizeBinary => { + let array = array + .as_any() + .downcast_ref::() + .unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index)) + } else { + None + }; + Box::new(FixedSizeBinaryScalar::new(array.data_type().clone(), value)) + }, + FixedSizeList => { + let array = array.as_any().downcast_ref::().unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index)) + } else { + None + }; + Box::new(FixedSizeListScalar::new(array.data_type().clone(), value)) + }, + Union => { + let array = array.as_any().downcast_ref::().unwrap(); + Box::new(UnionScalar::new( + array.data_type().clone(), + array.types()[index], + array.value(index), + )) + }, + Map => { + let array = array.as_any().downcast_ref::().unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index)) + } else { + None + }; + Box::new(MapScalar::new(array.data_type().clone(), value)) + }, + Dictionary(key_type) => match_integer_type!(key_type, |$T| { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + let value = if array.is_valid(index) { + Some(array.value(index).into()) + } else { + None + }; + Box::new(DictionaryScalar::<$T>::new( + array.data_type().clone(), + value, + )) + }), + } +} diff --git a/crates/nano-arrow/src/scalar/null.rs b/crates/nano-arrow/src/scalar/null.rs new file mode 100644 index 000000000000..2de7d7cde55b --- /dev/null +++ b/crates/nano-arrow/src/scalar/null.rs @@ -0,0 +1,37 @@ +use super::Scalar; +use crate::datatypes::DataType; + +/// The representation of a single entry of a [`crate::array::NullArray`]. 
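+/// # Example
+/// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::scalar::{NullScalar, Scalar};
+///
+/// let scalar = NullScalar::new();
+/// // a null scalar is never valid
+/// assert!(!scalar.is_valid());
+/// ```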
+#[derive(Debug, Clone, PartialEq, Eq)] +pub struct NullScalar {} + +impl NullScalar { + /// A new [`NullScalar`] + #[inline] + pub fn new() -> Self { + Self {} + } +} + +impl Default for NullScalar { + fn default() -> Self { + Self::new() + } +} + +impl Scalar for NullScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + false + } + + #[inline] + fn data_type(&self) -> &DataType { + &DataType::Null + } +} diff --git a/crates/nano-arrow/src/scalar/primitive.rs b/crates/nano-arrow/src/scalar/primitive.rs new file mode 100644 index 000000000000..3288708f6755 --- /dev/null +++ b/crates/nano-arrow/src/scalar/primitive.rs @@ -0,0 +1,67 @@ +use super::Scalar; +use crate::datatypes::DataType; +use crate::error::Error; +use crate::types::NativeType; + +/// The implementation of [`Scalar`] for primitive, semantically equivalent to [`Option`] +/// with [`DataType`]. +#[derive(Debug, Clone, PartialEq, Eq)] +pub struct PrimitiveScalar { + value: Option, + data_type: DataType, +} + +impl PrimitiveScalar { + /// Returns a new [`PrimitiveScalar`]. + #[inline] + pub fn new(data_type: DataType, value: Option) -> Self { + if !data_type.to_physical_type().eq_primitive(T::PRIMITIVE) { + panic!( + "{:?}", + Error::InvalidArgumentError(format!( + "Type {} does not support logical type {:?}", + std::any::type_name::(), + data_type + )) + ) + } + Self { value, data_type } + } + + /// Returns the optional value. + #[inline] + pub fn value(&self) -> &Option { + &self.value + } + + /// Returns a new `PrimitiveScalar` with the same value but different [`DataType`] + /// # Panic + /// This function panics if the `data_type` is not valid for self's physical type `T`. + pub fn to(self, data_type: DataType) -> Self { + Self::new(data_type, self.value) + } +} + +impl From> for PrimitiveScalar { + #[inline] + fn from(v: Option) -> Self { + Self::new(T::PRIMITIVE.into(), v) + } +} + +impl Scalar for PrimitiveScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.value.is_some() + } + + #[inline] + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/struct_.rs b/crates/nano-arrow/src/scalar/struct_.rs new file mode 100644 index 000000000000..29c2c33ba295 --- /dev/null +++ b/crates/nano-arrow/src/scalar/struct_.rs @@ -0,0 +1,54 @@ +use super::Scalar; +use crate::datatypes::DataType; + +/// A single entry of a [`crate::array::StructArray`]. +#[derive(Debug, Clone)] +pub struct StructScalar { + values: Vec>, + is_valid: bool, + data_type: DataType, +} + +impl PartialEq for StructScalar { + fn eq(&self, other: &Self) -> bool { + (self.data_type == other.data_type) + && (self.is_valid == other.is_valid) + && ((!self.is_valid) | (self.values == other.values)) + } +} + +impl StructScalar { + /// Returns a new [`StructScalar`] + #[inline] + pub fn new(data_type: DataType, values: Option>>) -> Self { + let is_valid = values.is_some(); + Self { + values: values.unwrap_or_default(), + is_valid, + data_type, + } + } + + /// Returns the values irrespectively of the validity. 
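+    /// # Example
+    /// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+    /// ```
+    /// use nano_arrow::datatypes::{DataType, Field};
+    /// use nano_arrow::scalar::{BooleanScalar, Scalar, StructScalar};
+    ///
+    /// let data_type = DataType::Struct(vec![Field::new("a", DataType::Boolean, true)]);
+    /// let values: Vec<Box<dyn Scalar>> = vec![Box::new(BooleanScalar::new(Some(true)))];
+    /// let scalar = StructScalar::new(data_type, Some(values));
+    /// assert_eq!(scalar.values().len(), 1);
+    /// ```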
+ #[inline] + pub fn values(&self) -> &[Box] { + &self.values + } +} + +impl Scalar for StructScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.is_valid + } + + #[inline] + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/union.rs b/crates/nano-arrow/src/scalar/union.rs new file mode 100644 index 000000000000..987e9f4e6044 --- /dev/null +++ b/crates/nano-arrow/src/scalar/union.rs @@ -0,0 +1,51 @@ +use super::Scalar; +use crate::datatypes::DataType; + +/// A single entry of a [`crate::array::UnionArray`]. +#[derive(Debug, Clone, PartialEq)] +pub struct UnionScalar { + value: Box, + type_: i8, + data_type: DataType, +} + +impl UnionScalar { + /// Returns a new [`UnionScalar`] + #[inline] + pub fn new(data_type: DataType, type_: i8, value: Box) -> Self { + Self { + value, + type_, + data_type, + } + } + + /// Returns the inner value + #[inline] + pub fn value(&self) -> &Box { + &self.value + } + + /// Returns the type of the union scalar + #[inline] + pub fn type_(&self) -> i8 { + self.type_ + } +} + +impl Scalar for UnionScalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + true + } + + #[inline] + fn data_type(&self) -> &DataType { + &self.data_type + } +} diff --git a/crates/nano-arrow/src/scalar/utf8.rs b/crates/nano-arrow/src/scalar/utf8.rs new file mode 100644 index 000000000000..ea08d30af578 --- /dev/null +++ b/crates/nano-arrow/src/scalar/utf8.rs @@ -0,0 +1,55 @@ +use super::Scalar; +use crate::datatypes::DataType; +use crate::offset::Offset; + +/// The implementation of [`Scalar`] for utf8, semantically equivalent to [`Option`]. +#[derive(Debug, Clone, PartialEq, Eq)] +pub struct Utf8Scalar { + value: Option, + phantom: std::marker::PhantomData, +} + +impl Utf8Scalar { + /// Returns a new [`Utf8Scalar`] + #[inline] + pub fn new>(value: Option
<P>
) -> Self { + Self { + value: value.map(|x| x.into()), + phantom: std::marker::PhantomData, + } + } + + /// Returns the value irrespectively of the validity. + #[inline] + pub fn value(&self) -> Option<&str> { + self.value.as_ref().map(|x| x.as_ref()) + } +} + +impl> From> for Utf8Scalar { + #[inline] + fn from(v: Option
<P>
) -> Self { + Self::new(v) + } +} + +impl Scalar for Utf8Scalar { + #[inline] + fn as_any(&self) -> &dyn std::any::Any { + self + } + + #[inline] + fn is_valid(&self) -> bool { + self.value.is_some() + } + + #[inline] + fn data_type(&self) -> &DataType { + if O::IS_LARGE { + &DataType::LargeUtf8 + } else { + &DataType::Utf8 + } + } +} diff --git a/crates/nano-arrow/src/temporal_conversions.rs b/crates/nano-arrow/src/temporal_conversions.rs new file mode 100644 index 000000000000..5058d1d887bd --- /dev/null +++ b/crates/nano-arrow/src/temporal_conversions.rs @@ -0,0 +1,543 @@ +//! Conversion methods for dates and times. + +use chrono::format::{parse, Parsed, StrftimeItems}; +use chrono::{Datelike, Duration, FixedOffset, NaiveDate, NaiveDateTime, NaiveTime}; + +use crate::array::{PrimitiveArray, Utf8Array}; +use crate::datatypes::{DataType, TimeUnit}; +use crate::error::{Error, Result}; +use crate::offset::Offset; +use crate::types::months_days_ns; + +/// Number of seconds in a day +pub const SECONDS_IN_DAY: i64 = 86_400; +/// Number of milliseconds in a second +pub const MILLISECONDS: i64 = 1_000; +/// Number of microseconds in a second +pub const MICROSECONDS: i64 = 1_000_000; +/// Number of nanoseconds in a second +pub const NANOSECONDS: i64 = 1_000_000_000; +/// Number of milliseconds in a day +pub const MILLISECONDS_IN_DAY: i64 = SECONDS_IN_DAY * MILLISECONDS; +/// Number of days between 0001-01-01 and 1970-01-01 +pub const EPOCH_DAYS_FROM_CE: i32 = 719_163; + +/// converts a `i32` representing a `date32` to [`NaiveDateTime`] +#[inline] +pub fn date32_to_datetime(v: i32) -> NaiveDateTime { + date32_to_datetime_opt(v).expect("invalid or out-of-range datetime") +} + +/// converts a `i32` representing a `date32` to [`NaiveDateTime`] +#[inline] +pub fn date32_to_datetime_opt(v: i32) -> Option { + NaiveDateTime::from_timestamp_opt(v as i64 * SECONDS_IN_DAY, 0) +} + +/// converts a `i32` representing a `date32` to [`NaiveDate`] +#[inline] +pub fn date32_to_date(days: i32) -> NaiveDate { + date32_to_date_opt(days).expect("out-of-range date") +} + +/// converts a `i32` representing a `date32` to [`NaiveDate`] +#[inline] +pub fn date32_to_date_opt(days: i32) -> Option { + NaiveDate::from_num_days_from_ce_opt(EPOCH_DAYS_FROM_CE + days) +} + +/// converts a `i64` representing a `date64` to [`NaiveDateTime`] +#[inline] +pub fn date64_to_datetime(v: i64) -> NaiveDateTime { + NaiveDateTime::from_timestamp_opt( + // extract seconds from milliseconds + v / MILLISECONDS, + // discard extracted seconds and convert milliseconds to nanoseconds + (v % MILLISECONDS * MICROSECONDS) as u32, + ) + .expect("invalid or out-of-range datetime") +} + +/// converts a `i64` representing a `date64` to [`NaiveDate`] +#[inline] +pub fn date64_to_date(milliseconds: i64) -> NaiveDate { + date64_to_datetime(milliseconds).date() +} + +/// converts a `i32` representing a `time32(s)` to [`NaiveTime`] +#[inline] +pub fn time32s_to_time(v: i32) -> NaiveTime { + NaiveTime::from_num_seconds_from_midnight_opt(v as u32, 0).expect("invalid time") +} + +/// converts a `i64` representing a `duration(s)` to [`Duration`] +#[inline] +pub fn duration_s_to_duration(v: i64) -> Duration { + Duration::seconds(v) +} + +/// converts a `i64` representing a `duration(ms)` to [`Duration`] +#[inline] +pub fn duration_ms_to_duration(v: i64) -> Duration { + Duration::milliseconds(v) +} + +/// converts a `i64` representing a `duration(us)` to [`Duration`] +#[inline] +pub fn duration_us_to_duration(v: i64) -> Duration { + Duration::microseconds(v) +} + 
+/// converts a `i64` representing a `duration(ns)` to [`Duration`] +#[inline] +pub fn duration_ns_to_duration(v: i64) -> Duration { + Duration::nanoseconds(v) +} + +/// converts a `i32` representing a `time32(ms)` to [`NaiveTime`] +#[inline] +pub fn time32ms_to_time(v: i32) -> NaiveTime { + let v = v as i64; + let seconds = v / MILLISECONDS; + + let milli_to_nano = 1_000_000; + let nano = (v - seconds * MILLISECONDS) * milli_to_nano; + NaiveTime::from_num_seconds_from_midnight_opt(seconds as u32, nano as u32) + .expect("invalid time") +} + +/// converts a `i64` representing a `time64(us)` to [`NaiveTime`] +#[inline] +pub fn time64us_to_time(v: i64) -> NaiveTime { + time64us_to_time_opt(v).expect("invalid time") +} + +/// converts a `i64` representing a `time64(us)` to [`NaiveTime`] +#[inline] +pub fn time64us_to_time_opt(v: i64) -> Option { + NaiveTime::from_num_seconds_from_midnight_opt( + // extract seconds from microseconds + (v / MICROSECONDS) as u32, + // discard extracted seconds and convert microseconds to + // nanoseconds + (v % MICROSECONDS * MILLISECONDS) as u32, + ) +} + +/// converts a `i64` representing a `time64(ns)` to [`NaiveTime`] +#[inline] +pub fn time64ns_to_time(v: i64) -> NaiveTime { + time64ns_to_time_opt(v).expect("invalid time") +} + +/// converts a `i64` representing a `time64(ns)` to [`NaiveTime`] +#[inline] +pub fn time64ns_to_time_opt(v: i64) -> Option { + NaiveTime::from_num_seconds_from_midnight_opt( + // extract seconds from nanoseconds + (v / NANOSECONDS) as u32, + // discard extracted seconds + (v % NANOSECONDS) as u32, + ) +} + +/// converts a `i64` representing a `timestamp(s)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_s_to_datetime(seconds: i64) -> NaiveDateTime { + timestamp_s_to_datetime_opt(seconds).expect("invalid or out-of-range datetime") +} + +/// converts a `i64` representing a `timestamp(s)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_s_to_datetime_opt(seconds: i64) -> Option { + NaiveDateTime::from_timestamp_opt(seconds, 0) +} + +/// converts a `i64` representing a `timestamp(ms)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_ms_to_datetime(v: i64) -> NaiveDateTime { + timestamp_ms_to_datetime_opt(v).expect("invalid or out-of-range datetime") +} + +/// converts a `i64` representing a `timestamp(ms)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_ms_to_datetime_opt(v: i64) -> Option { + if v >= 0 { + NaiveDateTime::from_timestamp_opt( + // extract seconds from milliseconds + v / MILLISECONDS, + // discard extracted seconds and convert milliseconds to nanoseconds + (v % MILLISECONDS * MICROSECONDS) as u32, + ) + } else { + let secs_rem = (v / MILLISECONDS, v % MILLISECONDS); + if secs_rem.1 == 0 { + // whole/integer seconds; no adjustment required + NaiveDateTime::from_timestamp_opt(secs_rem.0, 0) + } else { + // negative values with fractional seconds require 'div_floor' rounding behaviour. 
+ // (which isn't yet stabilised: https://github.com/rust-lang/rust/issues/88581) + NaiveDateTime::from_timestamp_opt( + secs_rem.0 - 1, + (NANOSECONDS + (v % MILLISECONDS * MICROSECONDS)) as u32, + ) + } + } +} + +/// converts a `i64` representing a `timestamp(us)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_us_to_datetime(v: i64) -> NaiveDateTime { + timestamp_us_to_datetime_opt(v).expect("invalid or out-of-range datetime") +} + +/// converts a `i64` representing a `timestamp(us)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_us_to_datetime_opt(v: i64) -> Option { + if v >= 0 { + NaiveDateTime::from_timestamp_opt( + // extract seconds from microseconds + v / MICROSECONDS, + // discard extracted seconds and convert microseconds to nanoseconds + (v % MICROSECONDS * MILLISECONDS) as u32, + ) + } else { + let secs_rem = (v / MICROSECONDS, v % MICROSECONDS); + if secs_rem.1 == 0 { + // whole/integer seconds; no adjustment required + NaiveDateTime::from_timestamp_opt(secs_rem.0, 0) + } else { + // negative values with fractional seconds require 'div_floor' rounding behaviour. + // (which isn't yet stabilised: https://github.com/rust-lang/rust/issues/88581) + NaiveDateTime::from_timestamp_opt( + secs_rem.0 - 1, + (NANOSECONDS + (v % MICROSECONDS * MILLISECONDS)) as u32, + ) + } + } +} + +/// converts a `i64` representing a `timestamp(ns)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_ns_to_datetime(v: i64) -> NaiveDateTime { + timestamp_ns_to_datetime_opt(v).expect("invalid or out-of-range datetime") +} + +/// converts a `i64` representing a `timestamp(ns)` to [`NaiveDateTime`] +#[inline] +pub fn timestamp_ns_to_datetime_opt(v: i64) -> Option { + if v >= 0 { + NaiveDateTime::from_timestamp_opt( + // extract seconds from nanoseconds + v / NANOSECONDS, + // discard extracted seconds + (v % NANOSECONDS) as u32, + ) + } else { + let secs_rem = (v / NANOSECONDS, v % NANOSECONDS); + if secs_rem.1 == 0 { + // whole/integer seconds; no adjustment required + NaiveDateTime::from_timestamp_opt(secs_rem.0, 0) + } else { + // negative values with fractional seconds require 'div_floor' rounding behaviour. + // (which isn't yet stabilised: https://github.com/rust-lang/rust/issues/88581) + NaiveDateTime::from_timestamp_opt( + secs_rem.0 - 1, + (NANOSECONDS + (v % NANOSECONDS)) as u32, + ) + } + } +} + +/// Converts a timestamp in `time_unit` and `timezone` into [`chrono::DateTime`]. +#[inline] +pub fn timestamp_to_naive_datetime(timestamp: i64, time_unit: TimeUnit) -> chrono::NaiveDateTime { + match time_unit { + TimeUnit::Second => timestamp_s_to_datetime(timestamp), + TimeUnit::Millisecond => timestamp_ms_to_datetime(timestamp), + TimeUnit::Microsecond => timestamp_us_to_datetime(timestamp), + TimeUnit::Nanosecond => timestamp_ns_to_datetime(timestamp), + } +} + +/// Converts a timestamp in `time_unit` and `timezone` into [`chrono::DateTime`]. +#[inline] +pub fn timestamp_to_datetime( + timestamp: i64, + time_unit: TimeUnit, + timezone: &T, +) -> chrono::DateTime { + timezone.from_utc_datetime(×tamp_to_naive_datetime(timestamp, time_unit)) +} + +/// Calculates the scale factor between two TimeUnits. The function returns the +/// scale that should multiply the TimeUnit "b" to have the same time scale as +/// the TimeUnit "a". 
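+/// # Example
+/// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::datatypes::TimeUnit;
+/// use nano_arrow::temporal_conversions::timeunit_scale;
+///
+/// // multiplying a value in milliseconds by 0.001 expresses it in seconds
+/// assert_eq!(timeunit_scale(TimeUnit::Second, TimeUnit::Millisecond), 0.001);
+/// assert_eq!(timeunit_scale(TimeUnit::Millisecond, TimeUnit::Second), 1_000.0);
+/// ```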
+pub fn timeunit_scale(a: TimeUnit, b: TimeUnit) -> f64 { + match (a, b) { + (TimeUnit::Second, TimeUnit::Second) => 1.0, + (TimeUnit::Second, TimeUnit::Millisecond) => 0.001, + (TimeUnit::Second, TimeUnit::Microsecond) => 0.000_001, + (TimeUnit::Second, TimeUnit::Nanosecond) => 0.000_000_001, + (TimeUnit::Millisecond, TimeUnit::Second) => 1_000.0, + (TimeUnit::Millisecond, TimeUnit::Millisecond) => 1.0, + (TimeUnit::Millisecond, TimeUnit::Microsecond) => 0.001, + (TimeUnit::Millisecond, TimeUnit::Nanosecond) => 0.000_001, + (TimeUnit::Microsecond, TimeUnit::Second) => 1_000_000.0, + (TimeUnit::Microsecond, TimeUnit::Millisecond) => 1_000.0, + (TimeUnit::Microsecond, TimeUnit::Microsecond) => 1.0, + (TimeUnit::Microsecond, TimeUnit::Nanosecond) => 0.001, + (TimeUnit::Nanosecond, TimeUnit::Second) => 1_000_000_000.0, + (TimeUnit::Nanosecond, TimeUnit::Millisecond) => 1_000_000.0, + (TimeUnit::Nanosecond, TimeUnit::Microsecond) => 1_000.0, + (TimeUnit::Nanosecond, TimeUnit::Nanosecond) => 1.0, + } +} + +/// Parses an offset of the form `"+WX:YZ"` or `"UTC"` into [`FixedOffset`]. +/// # Errors +/// If the offset is not in any of the allowed forms. +pub fn parse_offset(offset: &str) -> Result { + if offset == "UTC" { + return Ok(FixedOffset::east_opt(0).expect("FixedOffset::east out of bounds")); + } + let error = "timezone offset must be of the form [-]00:00"; + + let mut a = offset.split(':'); + let first = a + .next() + .map(Ok) + .unwrap_or_else(|| Err(Error::InvalidArgumentError(error.to_string())))?; + let last = a + .next() + .map(Ok) + .unwrap_or_else(|| Err(Error::InvalidArgumentError(error.to_string())))?; + let hours: i32 = first + .parse() + .map_err(|_| Error::InvalidArgumentError(error.to_string()))?; + let minutes: i32 = last + .parse() + .map_err(|_| Error::InvalidArgumentError(error.to_string()))?; + + Ok(FixedOffset::east_opt(hours * 60 * 60 + minutes * 60) + .expect("FixedOffset::east out of bounds")) +} + +/// Parses `value` to `Option` consistent with the Arrow's definition of timestamp with timezone. +/// `tz` must be built from `timezone` (either via [`parse_offset`] or `chrono-tz`). +#[inline] +pub fn utf8_to_timestamp_ns_scalar( + value: &str, + fmt: &str, + tz: &T, +) -> Option { + utf8_to_timestamp_scalar(value, fmt, tz, &TimeUnit::Nanosecond) +} + +/// Parses `value` to `Option` consistent with the Arrow's definition of timestamp with timezone. +/// `tz` must be built from `timezone` (either via [`parse_offset`] or `chrono-tz`). +/// Returns in scale `tz` of `TimeUnit`. +#[inline] +pub fn utf8_to_timestamp_scalar( + value: &str, + fmt: &str, + tz: &T, + tu: &TimeUnit, +) -> Option { + let mut parsed = Parsed::new(); + let fmt = StrftimeItems::new(fmt); + let r = parse(&mut parsed, value, fmt).ok(); + if r.is_some() { + parsed + .to_datetime() + .map(|x| x.naive_utc()) + .map(|x| tz.from_utc_datetime(&x)) + .map(|x| match tu { + TimeUnit::Second => x.timestamp(), + TimeUnit::Millisecond => x.timestamp_millis(), + TimeUnit::Microsecond => x.timestamp_micros(), + TimeUnit::Nanosecond => x.timestamp_nanos_opt().unwrap(), + }) + .ok() + } else { + None + } +} + +/// Parses `value` to `Option` consistent with the Arrow's definition of timestamp without timezone. +#[inline] +pub fn utf8_to_naive_timestamp_ns_scalar(value: &str, fmt: &str) -> Option { + utf8_to_naive_timestamp_scalar(value, fmt, &TimeUnit::Nanosecond) +} + +/// Parses `value` to `Option` consistent with the Arrow's definition of timestamp without timezone. +/// Returns in scale `tz` of `TimeUnit`. 
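+/// # Example
+/// An illustrative sketch (format strings follow `chrono`'s strftime syntax; assumes the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::datatypes::TimeUnit;
+/// use nano_arrow::temporal_conversions::utf8_to_naive_timestamp_scalar;
+///
+/// let seconds = utf8_to_naive_timestamp_scalar("2020-01-01 00:00:00", "%Y-%m-%d %H:%M:%S", &TimeUnit::Second);
+/// assert_eq!(seconds, Some(1_577_836_800));
+/// ```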
+#[inline] +pub fn utf8_to_naive_timestamp_scalar(value: &str, fmt: &str, tu: &TimeUnit) -> Option { + let fmt = StrftimeItems::new(fmt); + let mut parsed = Parsed::new(); + parse(&mut parsed, value, fmt.clone()).ok(); + parsed + .to_naive_datetime_with_offset(0) + .map(|x| match tu { + TimeUnit::Second => x.timestamp(), + TimeUnit::Millisecond => x.timestamp_millis(), + TimeUnit::Microsecond => x.timestamp_micros(), + TimeUnit::Nanosecond => x.timestamp_nanos_opt().unwrap(), + }) + .ok() +} + +fn utf8_to_timestamp_ns_impl( + array: &Utf8Array, + fmt: &str, + timezone: String, + tz: T, +) -> PrimitiveArray { + let iter = array + .iter() + .map(|x| x.and_then(|x| utf8_to_timestamp_ns_scalar(x, fmt, &tz))); + + PrimitiveArray::from_trusted_len_iter(iter) + .to(DataType::Timestamp(TimeUnit::Nanosecond, Some(timezone))) +} + +/// Parses `value` to a [`chrono_tz::Tz`] with the Arrow's definition of timestamp with a timezone. +#[cfg(feature = "chrono-tz")] +#[cfg_attr(docsrs, doc(cfg(feature = "chrono-tz")))] +pub fn parse_offset_tz(timezone: &str) -> Result { + timezone.parse::().map_err(|_| { + Error::InvalidArgumentError(format!("timezone \"{timezone}\" cannot be parsed")) + }) +} + +#[cfg(feature = "chrono-tz")] +#[cfg_attr(docsrs, doc(cfg(feature = "chrono-tz")))] +fn chrono_tz_utf_to_timestamp_ns( + array: &Utf8Array, + fmt: &str, + timezone: String, +) -> Result> { + let tz = parse_offset_tz(&timezone)?; + Ok(utf8_to_timestamp_ns_impl(array, fmt, timezone, tz)) +} + +#[cfg(not(feature = "chrono-tz"))] +fn chrono_tz_utf_to_timestamp_ns( + _: &Utf8Array, + _: &str, + timezone: String, +) -> Result> { + Err(Error::InvalidArgumentError(format!( + "timezone \"{timezone}\" cannot be parsed (feature chrono-tz is not active)", + ))) +} + +/// Parses a [`Utf8Array`] to a timeozone-aware timestamp, i.e. [`PrimitiveArray`] with type `Timestamp(Nanosecond, Some(timezone))`. +/// # Implementation +/// * parsed values with timezone other than `timezone` are converted to `timezone`. +/// * parsed values without timezone are null. Use [`utf8_to_naive_timestamp_ns`] to parse naive timezones. +/// * Null elements remain null; non-parsable elements are null. +/// The feature `"chrono-tz"` enables IANA and zoneinfo formats for `timezone`. +/// # Error +/// This function errors iff `timezone` is not parsable to an offset. +pub fn utf8_to_timestamp_ns( + array: &Utf8Array, + fmt: &str, + timezone: String, +) -> Result> { + let tz = parse_offset(timezone.as_str()); + + if let Ok(tz) = tz { + Ok(utf8_to_timestamp_ns_impl(array, fmt, timezone, tz)) + } else { + chrono_tz_utf_to_timestamp_ns(array, fmt, timezone) + } +} + +/// Parses a [`Utf8Array`] to naive timestamp, i.e. +/// [`PrimitiveArray`] with type `Timestamp(Nanosecond, None)`. +/// Timezones are ignored. +/// Null elements remain null; non-parsable elements are set to null. 
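+/// # Example
+/// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+/// ```
+/// use nano_arrow::array::Utf8Array;
+/// use nano_arrow::temporal_conversions::utf8_to_naive_timestamp_ns;
+///
+/// let array = Utf8Array::<i32>::from_slice(["2020-01-01 00:00:00", "not a timestamp"]);
+/// let parsed = utf8_to_naive_timestamp_ns(&array, "%Y-%m-%d %H:%M:%S");
+/// // the first slot parses to nanoseconds since the epoch; the second becomes null
+/// assert_eq!(parsed.value(0), 1_577_836_800_000_000_000);
+/// assert!(!parsed.is_valid(1));
+/// ```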
+pub fn utf8_to_naive_timestamp_ns( + array: &Utf8Array, + fmt: &str, +) -> PrimitiveArray { + let iter = array + .iter() + .map(|x| x.and_then(|x| utf8_to_naive_timestamp_ns_scalar(x, fmt))); + + PrimitiveArray::from_trusted_len_iter(iter).to(DataType::Timestamp(TimeUnit::Nanosecond, None)) +} + +fn add_month(year: i32, month: u32, months: i32) -> chrono::NaiveDate { + let new_year = (year * 12 + (month - 1) as i32 + months) / 12; + let new_month = (year * 12 + (month - 1) as i32 + months) % 12 + 1; + chrono::NaiveDate::from_ymd_opt(new_year, new_month as u32, 1) + .expect("invalid or out-of-range date") +} + +fn get_days_between_months(year: i32, month: u32, months: i32) -> i64 { + add_month(year, month, months) + .signed_duration_since( + chrono::NaiveDate::from_ymd_opt(year, month, 1).expect("invalid or out-of-range date"), + ) + .num_days() +} + +/// Adds an `interval` to a `timestamp` in `time_unit` units without timezone. +#[inline] +pub fn add_naive_interval(timestamp: i64, time_unit: TimeUnit, interval: months_days_ns) -> i64 { + // convert seconds to a DateTime of a given offset. + let datetime = match time_unit { + TimeUnit::Second => timestamp_s_to_datetime(timestamp), + TimeUnit::Millisecond => timestamp_ms_to_datetime(timestamp), + TimeUnit::Microsecond => timestamp_us_to_datetime(timestamp), + TimeUnit::Nanosecond => timestamp_ns_to_datetime(timestamp), + }; + + // compute the number of days in the interval, which depends on the particular year and month (leap days) + let delta_days = get_days_between_months(datetime.year(), datetime.month(), interval.months()) + + interval.days() as i64; + + // add; no leap hours are considered + let new_datetime_tz = datetime + + chrono::Duration::nanoseconds(delta_days * 24 * 60 * 60 * 1_000_000_000 + interval.ns()); + + // convert back to the target unit + match time_unit { + TimeUnit::Second => new_datetime_tz.timestamp_millis() / 1000, + TimeUnit::Millisecond => new_datetime_tz.timestamp_millis(), + TimeUnit::Microsecond => new_datetime_tz.timestamp_nanos_opt().unwrap() / 1000, + TimeUnit::Nanosecond => new_datetime_tz.timestamp_nanos_opt().unwrap(), + } +} + +/// Adds an `interval` to a `timestamp` in `time_unit` units and timezone `timezone`. +#[inline] +pub fn add_interval( + timestamp: i64, + time_unit: TimeUnit, + interval: months_days_ns, + timezone: &T, +) -> i64 { + // convert seconds to a DateTime of a given offset. + let datetime_tz = timestamp_to_datetime(timestamp, time_unit, timezone); + + // compute the number of days in the interval, which depends on the particular year and month (leap days) + let delta_days = + get_days_between_months(datetime_tz.year(), datetime_tz.month(), interval.months()) + + interval.days() as i64; + + // add; tz will take care of leap hours + let new_datetime_tz = datetime_tz + + chrono::Duration::nanoseconds(delta_days * 24 * 60 * 60 * 1_000_000_000 + interval.ns()); + + // convert back to the target unit + match time_unit { + TimeUnit::Second => new_datetime_tz.timestamp_millis() / 1000, + TimeUnit::Millisecond => new_datetime_tz.timestamp_millis(), + TimeUnit::Microsecond => new_datetime_tz.timestamp_nanos_opt().unwrap() / 1000, + TimeUnit::Nanosecond => new_datetime_tz.timestamp_nanos_opt().unwrap(), + } +} diff --git a/crates/nano-arrow/src/trusted_len.rs b/crates/nano-arrow/src/trusted_len.rs new file mode 100644 index 000000000000..a1c38bd51c71 --- /dev/null +++ b/crates/nano-arrow/src/trusted_len.rs @@ -0,0 +1,57 @@ +//! Declares [`TrustedLen`]. 
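+//! # Example
+//! An illustrative sketch of using the bound (assuming the crate is imported as `nano_arrow` and this module is public):
+//! ```
+//! use nano_arrow::trusted_len::TrustedLen;
+//!
+//! // hypothetical helper: a `TrustedLen` iterator reports its exact length via `size_hint`
+//! fn exact_len<I: TrustedLen>(iter: I) -> usize {
+//!     iter.size_hint().1.unwrap()
+//! }
+//! assert_eq!(exact_len([1u32, 2, 3].iter().copied()), 3);
+//! ```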
+use std::slice::Iter; + +/// An iterator of known, fixed size. +/// A trait denoting Rusts' unstable [TrustedLen](https://doc.rust-lang.org/std/iter/trait.TrustedLen.html). +/// This is re-defined here and implemented for some iterators until `std::iter::TrustedLen` +/// is stabilized. +/// +/// # Safety +/// This trait must only be implemented when the contract is upheld. +/// Consumers of this trait must inspect Iterator::size_hint()’s upper bound. +pub unsafe trait TrustedLen: Iterator {} + +unsafe impl TrustedLen for Iter<'_, T> {} + +unsafe impl B> TrustedLen for std::iter::Map {} + +unsafe impl<'a, I, T: 'a> TrustedLen for std::iter::Copied +where + I: TrustedLen, + T: Copy, +{ +} +unsafe impl<'a, I, T: 'a> TrustedLen for std::iter::Cloned +where + I: TrustedLen, + T: Clone, +{ +} + +unsafe impl TrustedLen for std::iter::Enumerate where I: TrustedLen {} + +unsafe impl TrustedLen for std::iter::Zip +where + A: TrustedLen, + B: TrustedLen, +{ +} + +unsafe impl TrustedLen for std::slice::ChunksExact<'_, T> {} + +unsafe impl TrustedLen for std::slice::Windows<'_, T> {} + +unsafe impl TrustedLen for std::iter::Chain +where + A: TrustedLen, + B: TrustedLen, +{ +} + +unsafe impl TrustedLen for std::iter::Once {} + +unsafe impl TrustedLen for std::vec::IntoIter {} + +unsafe impl TrustedLen for std::iter::Repeat {} +unsafe impl A> TrustedLen for std::iter::RepeatWith {} +unsafe impl TrustedLen for std::iter::Take {} diff --git a/crates/nano-arrow/src/types/bit_chunk.rs b/crates/nano-arrow/src/types/bit_chunk.rs new file mode 100644 index 000000000000..ef4b25fd28a2 --- /dev/null +++ b/crates/nano-arrow/src/types/bit_chunk.rs @@ -0,0 +1,161 @@ +use std::fmt::Binary; +use std::ops::{BitAndAssign, Not, Shl, ShlAssign, ShrAssign}; + +use num_traits::PrimInt; + +use super::NativeType; + +/// A chunk of bits. This is used to create masks of a given length +/// whose width is `1` bit. In `portable_simd` notation, this corresponds to `m1xY`. +/// +/// This (sealed) trait is implemented for [`u8`], [`u16`], [`u32`] and [`u64`]. +pub trait BitChunk: + super::private::Sealed + + PrimInt + + NativeType + + Binary + + ShlAssign + + Not + + ShrAssign + + ShlAssign + + Shl + + BitAndAssign +{ + /// convert itself into bytes. + fn to_ne_bytes(self) -> Self::Bytes; + /// convert itself from bytes. + fn from_ne_bytes(v: Self::Bytes) -> Self; +} + +macro_rules! bit_chunk { + ($ty:ty) => { + impl BitChunk for $ty { + #[inline(always)] + fn to_ne_bytes(self) -> Self::Bytes { + self.to_ne_bytes() + } + + #[inline(always)] + fn from_ne_bytes(v: Self::Bytes) -> Self { + Self::from_ne_bytes(v) + } + } + }; +} + +bit_chunk!(u8); +bit_chunk!(u16); +bit_chunk!(u32); +bit_chunk!(u64); + +/// An [`Iterator`] over a [`BitChunk`]. This iterator is often +/// compiled to SIMD. +/// The [LSB](https://en.wikipedia.org/wiki/Bit_numbering#Least_significant_bit) corresponds +/// to the first slot, as defined by the arrow specification. +/// # Example +/// ``` +/// use arrow2::types::BitChunkIter; +/// let a = 0b00010000u8; +/// let iter = BitChunkIter::new(a, 7); +/// let r = iter.collect::>(); +/// assert_eq!(r, vec![false, false, false, false, true, false, false]); +/// ``` +pub struct BitChunkIter { + value: T, + mask: T, + remaining: usize, +} + +impl BitChunkIter { + /// Creates a new [`BitChunkIter`] with `len` bits. 
+ #[inline] + pub fn new(value: T, len: usize) -> Self { + assert!(len <= std::mem::size_of::() * 8); + Self { + value, + remaining: len, + mask: T::one(), + } + } +} + +impl Iterator for BitChunkIter { + type Item = bool; + + #[inline] + fn next(&mut self) -> Option { + if self.remaining == 0 { + return None; + }; + let result = Some(self.value & self.mask != T::zero()); + self.remaining -= 1; + self.mask <<= 1; + result + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.remaining, Some(self.remaining)) + } +} + +// # Safety +// a mathematical invariant of this iterator +unsafe impl crate::trusted_len::TrustedLen for BitChunkIter {} + +/// An [`Iterator`] over a [`BitChunk`] returning the index of each bit set in the chunk +/// See for details +/// # Example +/// ``` +/// use arrow2::types::BitChunkOnes; +/// let a = 0b00010000u8; +/// let iter = BitChunkOnes::new(a); +/// let r = iter.collect::>(); +/// assert_eq!(r, vec![4]); +/// ``` +pub struct BitChunkOnes { + value: T, + remaining: usize, +} + +impl BitChunkOnes { + /// Creates a new [`BitChunkOnes`] with `len` bits. + #[inline] + pub fn new(value: T) -> Self { + Self { + value, + remaining: value.count_ones() as usize, + } + } + + #[inline] + #[cfg(feature = "compute_filter")] + pub(crate) fn from_known_count(value: T, remaining: usize) -> Self { + Self { value, remaining } + } +} + +impl Iterator for BitChunkOnes { + type Item = usize; + + #[inline] + fn next(&mut self) -> Option { + if self.remaining == 0 { + return None; + } + let v = self.value.trailing_zeros() as usize; + self.value &= self.value - T::one(); + + self.remaining -= 1; + Some(v) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + (self.remaining, Some(self.remaining)) + } +} + +// # Safety +// a mathematical invariant of this iterator +unsafe impl crate::trusted_len::TrustedLen for BitChunkOnes {} diff --git a/crates/nano-arrow/src/types/index.rs b/crates/nano-arrow/src/types/index.rs new file mode 100644 index 000000000000..0aedea008fa3 --- /dev/null +++ b/crates/nano-arrow/src/types/index.rs @@ -0,0 +1,103 @@ +use std::convert::TryFrom; + +use super::NativeType; +use crate::trusted_len::TrustedLen; + +/// Sealed trait describing the subset of [`NativeType`] (`i32`, `i64`, `u32` and `u64`) +/// that can be used to index a slot of an array. +pub trait Index: + NativeType + + std::ops::AddAssign + + std::ops::Sub + + num_traits::One + + num_traits::Num + + num_traits::CheckedAdd + + PartialOrd + + Ord +{ + /// Convert itself to [`usize`]. + fn to_usize(&self) -> usize; + /// Convert itself from [`usize`]. + fn from_usize(index: usize) -> Option; + + /// Convert itself from [`usize`]. + fn from_as_usize(index: usize) -> Self; + + /// An iterator from (inclusive) `start` to (exclusive) `end`. + fn range(start: usize, end: usize) -> Option> { + let start = Self::from_usize(start); + let end = Self::from_usize(end); + match (start, end) { + (Some(start), Some(end)) => Some(IndexRange::new(start, end)), + _ => None, + } + } +} + +macro_rules! index { + ($t:ty) => { + impl Index for $t { + #[inline] + fn to_usize(&self) -> usize { + *self as usize + } + + #[inline] + fn from_usize(value: usize) -> Option { + Self::try_from(value).ok() + } + + #[inline] + fn from_as_usize(value: usize) -> Self { + value as $t + } + } + }; +} + +index!(i8); +index!(i16); +index!(i32); +index!(i64); +index!(u8); +index!(u16); +index!(u32); +index!(u64); + +/// Range of [`Index`], equivalent to `(a..b)`. 
+/// `Step` is unstable in Rust, which does not allow us to implement (a..b) for [`Index`]. +pub struct IndexRange { + start: I, + end: I, +} + +impl IndexRange { + /// Returns a new [`IndexRange`]. + pub fn new(start: I, end: I) -> Self { + assert!(end >= start); + Self { start, end } + } +} + +impl Iterator for IndexRange { + type Item = I; + + #[inline] + fn next(&mut self) -> Option { + if self.start == self.end { + return None; + } + let old = self.start; + self.start += I::one(); + Some(old) + } + + #[inline] + fn size_hint(&self) -> (usize, Option) { + let len = (self.end - self.start).to_usize(); + (len, Some(len)) + } +} + +/// Safety: a range is always of known length +unsafe impl TrustedLen for IndexRange {} diff --git a/crates/nano-arrow/src/types/mod.rs b/crates/nano-arrow/src/types/mod.rs new file mode 100644 index 000000000000..2ba57b4d784a --- /dev/null +++ b/crates/nano-arrow/src/types/mod.rs @@ -0,0 +1,89 @@ +//! Sealed traits and implementations to handle all _physical types_ used in this crate. +//! +//! Most physical types used in this crate are native Rust types, such as `i32`. +//! The trait [`NativeType`] describes the interfaces required by this crate to be conformant +//! with Arrow. +//! +//! Every implementation of [`NativeType`] has an associated variant in [`PrimitiveType`], +//! available via [`NativeType::PRIMITIVE`]. +//! Combined, these allow structs generic over [`NativeType`] to be trait objects downcastable +//! to concrete implementations based on the matched [`NativeType::PRIMITIVE`] variant. +//! +//! Another important trait in this module is [`Offset`], the subset of [`NativeType`] that can +//! be used in Arrow offsets (`i32` and `i64`). +//! +//! Another important trait in this module is [`BitChunk`], describing types that can be used to +//! represent chunks of bits (e.g. 8 bits via `u8`, 16 via `u16`), and [`BitChunkIter`], +//! that can be used to iterate over bitmaps in [`BitChunk`]s according to +//! Arrow's definition of bitmaps. +//! +//! Finally, this module contains traits used to compile code based on [`NativeType`] optimized +//! for SIMD, at [`mod@simd`]. + +mod bit_chunk; +pub use bit_chunk::{BitChunk, BitChunkIter, BitChunkOnes}; +mod index; +pub mod simd; +pub use index::*; +mod native; +pub use native::*; +mod offset; +pub use offset::*; +#[cfg(feature = "serde_types")] +use serde_derive::{Deserialize, Serialize}; + +/// The set of all implementations of the sealed trait [`NativeType`]. +#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)] +#[cfg_attr(feature = "serde_types", derive(Serialize, Deserialize))] +pub enum PrimitiveType { + /// A signed 8-bit integer. + Int8, + /// A signed 16-bit integer. + Int16, + /// A signed 32-bit integer. + Int32, + /// A signed 64-bit integer. + Int64, + /// A signed 128-bit integer. + Int128, + /// A signed 256-bit integer. + Int256, + /// An unsigned 8-bit integer. + UInt8, + /// An unsigned 16-bit integer. + UInt16, + /// An unsigned 32-bit integer. + UInt32, + /// An unsigned 64-bit integer. + UInt64, + /// A 16-bit floating point number. + Float16, + /// A 32-bit floating point number. + Float32, + /// A 64-bit floating point number. 
+ Float64, + /// Two i32 representing days and ms + DaysMs, + /// months_days_ns(i32, i32, i64) + MonthDayNano, +} + +mod private { + pub trait Sealed {} + + impl Sealed for u8 {} + impl Sealed for u16 {} + impl Sealed for u32 {} + impl Sealed for u64 {} + impl Sealed for i8 {} + impl Sealed for i16 {} + impl Sealed for i32 {} + impl Sealed for i64 {} + impl Sealed for i128 {} + impl Sealed for super::i256 {} + impl Sealed for super::f16 {} + impl Sealed for f32 {} + impl Sealed for f64 {} + impl Sealed for super::days_ms {} + impl Sealed for super::months_days_ns {} +} diff --git a/crates/nano-arrow/src/types/native.rs b/crates/nano-arrow/src/types/native.rs new file mode 100644 index 000000000000..6e50a1454ead --- /dev/null +++ b/crates/nano-arrow/src/types/native.rs @@ -0,0 +1,639 @@ +use std::convert::TryFrom; +use std::ops::Neg; +use std::panic::RefUnwindSafe; + +use bytemuck::{Pod, Zeroable}; + +use super::PrimitiveType; + +/// Sealed trait implemented by all physical types that can be allocated, +/// serialized and deserialized by this crate. +/// All O(N) allocations in this crate are done for this trait alone. +pub trait NativeType: + super::private::Sealed + + Pod + + Send + + Sync + + Sized + + RefUnwindSafe + + std::fmt::Debug + + std::fmt::Display + + PartialEq + + Default +{ + /// The corresponding variant of [`PrimitiveType`]. + const PRIMITIVE: PrimitiveType; + + /// Type denoting its representation as bytes. + /// This is `[u8; N]` where `N = size_of::`. + type Bytes: AsRef<[u8]> + + std::ops::Index + + std::ops::IndexMut + + for<'a> TryFrom<&'a [u8]> + + std::fmt::Debug + + Default; + + /// To bytes in little endian + fn to_le_bytes(&self) -> Self::Bytes; + + /// To bytes in big endian + fn to_be_bytes(&self) -> Self::Bytes; + + /// From bytes in little endian + fn from_le_bytes(bytes: Self::Bytes) -> Self; + + /// From bytes in big endian + fn from_be_bytes(bytes: Self::Bytes) -> Self; +} + +macro_rules! native_type { + ($type:ty, $primitive_type:expr) => { + impl NativeType for $type { + const PRIMITIVE: PrimitiveType = $primitive_type; + + type Bytes = [u8; std::mem::size_of::()]; + #[inline] + fn to_le_bytes(&self) -> Self::Bytes { + Self::to_le_bytes(*self) + } + + #[inline] + fn to_be_bytes(&self) -> Self::Bytes { + Self::to_be_bytes(*self) + } + + #[inline] + fn from_le_bytes(bytes: Self::Bytes) -> Self { + Self::from_le_bytes(bytes) + } + + #[inline] + fn from_be_bytes(bytes: Self::Bytes) -> Self { + Self::from_be_bytes(bytes) + } + } + }; +} + +native_type!(u8, PrimitiveType::UInt8); +native_type!(u16, PrimitiveType::UInt16); +native_type!(u32, PrimitiveType::UInt32); +native_type!(u64, PrimitiveType::UInt64); +native_type!(i8, PrimitiveType::Int8); +native_type!(i16, PrimitiveType::Int16); +native_type!(i32, PrimitiveType::Int32); +native_type!(i64, PrimitiveType::Int64); +native_type!(f32, PrimitiveType::Float32); +native_type!(f64, PrimitiveType::Float64); +native_type!(i128, PrimitiveType::Int128); + +/// The in-memory representation of the DayMillisecond variant of arrow's "Interval" logical type. +#[derive(Debug, Copy, Clone, Default, PartialEq, Eq, Hash, Zeroable, Pod)] +#[allow(non_camel_case_types)] +#[repr(C)] +pub struct days_ms(pub i32, pub i32); + +impl days_ms { + /// A new [`days_ms`]. 
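+    /// # Example
+    /// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+    /// ```
+    /// use nano_arrow::types::days_ms;
+    ///
+    /// let interval = days_ms::new(1, 500);
+    /// assert_eq!(interval.days(), 1);
+    /// assert_eq!(interval.milliseconds(), 500);
+    /// ```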
+ #[inline] + pub fn new(days: i32, milliseconds: i32) -> Self { + Self(days, milliseconds) + } + + /// The number of days + #[inline] + pub fn days(&self) -> i32 { + self.0 + } + + /// The number of milliseconds + #[inline] + pub fn milliseconds(&self) -> i32 { + self.1 + } +} + +impl NativeType for days_ms { + const PRIMITIVE: PrimitiveType = PrimitiveType::DaysMs; + type Bytes = [u8; 8]; + #[inline] + fn to_le_bytes(&self) -> Self::Bytes { + let days = self.0.to_le_bytes(); + let ms = self.1.to_le_bytes(); + let mut result = [0; 8]; + result[0] = days[0]; + result[1] = days[1]; + result[2] = days[2]; + result[3] = days[3]; + result[4] = ms[0]; + result[5] = ms[1]; + result[6] = ms[2]; + result[7] = ms[3]; + result + } + + #[inline] + fn to_be_bytes(&self) -> Self::Bytes { + let days = self.0.to_be_bytes(); + let ms = self.1.to_be_bytes(); + let mut result = [0; 8]; + result[0] = days[0]; + result[1] = days[1]; + result[2] = days[2]; + result[3] = days[3]; + result[4] = ms[0]; + result[5] = ms[1]; + result[6] = ms[2]; + result[7] = ms[3]; + result + } + + #[inline] + fn from_le_bytes(bytes: Self::Bytes) -> Self { + let mut days = [0; 4]; + days[0] = bytes[0]; + days[1] = bytes[1]; + days[2] = bytes[2]; + days[3] = bytes[3]; + let mut ms = [0; 4]; + ms[0] = bytes[4]; + ms[1] = bytes[5]; + ms[2] = bytes[6]; + ms[3] = bytes[7]; + Self(i32::from_le_bytes(days), i32::from_le_bytes(ms)) + } + + #[inline] + fn from_be_bytes(bytes: Self::Bytes) -> Self { + let mut days = [0; 4]; + days[0] = bytes[0]; + days[1] = bytes[1]; + days[2] = bytes[2]; + days[3] = bytes[3]; + let mut ms = [0; 4]; + ms[0] = bytes[4]; + ms[1] = bytes[5]; + ms[2] = bytes[6]; + ms[3] = bytes[7]; + Self(i32::from_be_bytes(days), i32::from_be_bytes(ms)) + } +} + +/// The in-memory representation of the MonthDayNano variant of the "Interval" logical type. +#[derive(Debug, Copy, Clone, Default, PartialEq, Eq, Hash, Zeroable, Pod)] +#[allow(non_camel_case_types)] +#[repr(C)] +pub struct months_days_ns(pub i32, pub i32, pub i64); + +impl months_days_ns { + /// A new [`months_days_ns`]. 
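+    /// # Example
+    /// An illustrative sketch (assuming the crate is imported as `nano_arrow`):
+    /// ```
+    /// use nano_arrow::types::months_days_ns;
+    ///
+    /// let interval = months_days_ns::new(1, 2, 3);
+    /// assert_eq!(interval.months(), 1);
+    /// assert_eq!(interval.days(), 2);
+    /// assert_eq!(interval.ns(), 3);
+    /// ```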
+ #[inline] + pub fn new(months: i32, days: i32, nanoseconds: i64) -> Self { + Self(months, days, nanoseconds) + } + + /// The number of months + #[inline] + pub fn months(&self) -> i32 { + self.0 + } + + /// The number of days + #[inline] + pub fn days(&self) -> i32 { + self.1 + } + + /// The number of nanoseconds + #[inline] + pub fn ns(&self) -> i64 { + self.2 + } +} + +impl NativeType for months_days_ns { + const PRIMITIVE: PrimitiveType = PrimitiveType::MonthDayNano; + type Bytes = [u8; 16]; + #[inline] + fn to_le_bytes(&self) -> Self::Bytes { + let months = self.months().to_le_bytes(); + let days = self.days().to_le_bytes(); + let ns = self.ns().to_le_bytes(); + let mut result = [0; 16]; + result[0] = months[0]; + result[1] = months[1]; + result[2] = months[2]; + result[3] = months[3]; + result[4] = days[0]; + result[5] = days[1]; + result[6] = days[2]; + result[7] = days[3]; + (0..8).for_each(|i| { + result[8 + i] = ns[i]; + }); + result + } + + #[inline] + fn to_be_bytes(&self) -> Self::Bytes { + let months = self.months().to_be_bytes(); + let days = self.days().to_be_bytes(); + let ns = self.ns().to_be_bytes(); + let mut result = [0; 16]; + result[0] = months[0]; + result[1] = months[1]; + result[2] = months[2]; + result[3] = months[3]; + result[4] = days[0]; + result[5] = days[1]; + result[6] = days[2]; + result[7] = days[3]; + (0..8).for_each(|i| { + result[8 + i] = ns[i]; + }); + result + } + + #[inline] + fn from_le_bytes(bytes: Self::Bytes) -> Self { + let mut months = [0; 4]; + months[0] = bytes[0]; + months[1] = bytes[1]; + months[2] = bytes[2]; + months[3] = bytes[3]; + let mut days = [0; 4]; + days[0] = bytes[4]; + days[1] = bytes[5]; + days[2] = bytes[6]; + days[3] = bytes[7]; + let mut ns = [0; 8]; + (0..8).for_each(|i| { + ns[i] = bytes[8 + i]; + }); + Self( + i32::from_le_bytes(months), + i32::from_le_bytes(days), + i64::from_le_bytes(ns), + ) + } + + #[inline] + fn from_be_bytes(bytes: Self::Bytes) -> Self { + let mut months = [0; 4]; + months[0] = bytes[0]; + months[1] = bytes[1]; + months[2] = bytes[2]; + months[3] = bytes[3]; + let mut days = [0; 4]; + days[0] = bytes[4]; + days[1] = bytes[5]; + days[2] = bytes[6]; + days[3] = bytes[7]; + let mut ns = [0; 8]; + (0..8).for_each(|i| { + ns[i] = bytes[8 + i]; + }); + Self( + i32::from_be_bytes(months), + i32::from_be_bytes(days), + i64::from_be_bytes(ns), + ) + } +} + +impl std::fmt::Display for days_ms { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{}d {}ms", self.days(), self.milliseconds()) + } +} + +impl std::fmt::Display for months_days_ns { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{}m {}d {}ns", self.months(), self.days(), self.ns()) + } +} + +impl Neg for days_ms { + type Output = Self; + + #[inline(always)] + fn neg(self) -> Self::Output { + Self::new(-self.days(), -self.milliseconds()) + } +} + +impl Neg for months_days_ns { + type Output = Self; + + #[inline(always)] + fn neg(self) -> Self::Output { + Self::new(-self.months(), -self.days(), -self.ns()) + } +} + +/// Type representation of the Float16 physical type +#[derive(Copy, Clone, Default, Zeroable, Pod)] +#[allow(non_camel_case_types)] +#[repr(C)] +pub struct f16(pub u16); + +impl PartialEq for f16 { + #[inline] + fn eq(&self, other: &f16) -> bool { + if self.is_nan() || other.is_nan() { + false + } else { + (self.0 == other.0) || ((self.0 | other.0) & 0x7FFFu16 == 0) + } + } +} + +// see https://github.com/starkat99/half-rs/blob/main/src/binary16.rs +impl f16 { + /// 
The difference between 1.0 and the next largest representable number. + pub const EPSILON: f16 = f16(0x1400u16); + + #[inline] + #[must_use] + pub(crate) const fn is_nan(self) -> bool { + self.0 & 0x7FFFu16 > 0x7C00u16 + } + + /// Casts from u16. + #[inline] + pub const fn from_bits(bits: u16) -> f16 { + f16(bits) + } + + /// Casts to u16. + #[inline] + pub const fn to_bits(self) -> u16 { + self.0 + } + + /// Casts this `f16` to `f32` + pub fn to_f32(self) -> f32 { + let i = self.0; + // Check for signed zero + if i & 0x7FFFu16 == 0 { + return f32::from_bits((i as u32) << 16); + } + + let half_sign = (i & 0x8000u16) as u32; + let half_exp = (i & 0x7C00u16) as u32; + let half_man = (i & 0x03FFu16) as u32; + + // Check for an infinity or NaN when all exponent bits set + if half_exp == 0x7C00u32 { + // Check for signed infinity if mantissa is zero + if half_man == 0 { + let number = (half_sign << 16) | 0x7F80_0000u32; + return f32::from_bits(number); + } else { + // NaN, keep current mantissa but also set most significiant mantissa bit + let number = (half_sign << 16) | 0x7FC0_0000u32 | (half_man << 13); + return f32::from_bits(number); + } + } + + // Calculate single-precision components with adjusted exponent + let sign = half_sign << 16; + // Unbias exponent + let unbiased_exp = ((half_exp as i32) >> 10) - 15; + + // Check for subnormals, which will be normalized by adjusting exponent + if half_exp == 0 { + // Calculate how much to adjust the exponent by + let e = (half_man as u16).leading_zeros() - 6; + + // Rebias and adjust exponent + let exp = (127 - 15 - e) << 23; + let man = (half_man << (14 + e)) & 0x7F_FF_FFu32; + return f32::from_bits(sign | exp | man); + } + + // Rebias exponent for a normalized normal + let exp = ((unbiased_exp + 127) as u32) << 23; + let man = (half_man & 0x03FFu32) << 13; + f32::from_bits(sign | exp | man) + } + + /// Casts an `f32` into `f16` + pub fn from_f32(value: f32) -> Self { + let x: u32 = value.to_bits(); + + // Extract IEEE754 components + let sign = x & 0x8000_0000u32; + let exp = x & 0x7F80_0000u32; + let man = x & 0x007F_FFFFu32; + + // Check for all exponent bits being set, which is Infinity or NaN + if exp == 0x7F80_0000u32 { + // Set mantissa MSB for NaN (and also keep shifted mantissa bits) + let nan_bit = if man == 0 { 0 } else { 0x0200u32 }; + return f16(((sign >> 16) | 0x7C00u32 | nan_bit | (man >> 13)) as u16); + } + + // The number is normalized, start assembling half precision version + let half_sign = sign >> 16; + // Unbias the exponent, then bias for half precision + let unbiased_exp = ((exp >> 23) as i32) - 127; + let half_exp = unbiased_exp + 15; + + // Check for exponent overflow, return +infinity + if half_exp >= 0x1F { + return f16((half_sign | 0x7C00u32) as u16); + } + + // Check for underflow + if half_exp <= 0 { + // Check mantissa for what we can do + if 14 - half_exp > 24 { + // No rounding possibility, so this is a full underflow, return signed zero + return f16(half_sign as u16); + } + // Don't forget about hidden leading mantissa bit when assembling mantissa + let man = man | 0x0080_0000u32; + let mut half_man = man >> (14 - half_exp); + // Check for rounding (see comment above functions) + let round_bit = 1 << (13 - half_exp); + if (man & round_bit) != 0 && (man & (3 * round_bit - 1)) != 0 { + half_man += 1; + } + // No exponent for subnormals + return f16((half_sign | half_man) as u16); + } + + // Rebias the exponent + let half_exp = (half_exp as u32) << 10; + let half_man = man >> 13; + // Check for rounding (see 
comment above functions) + let round_bit = 0x0000_1000u32; + if (man & round_bit) != 0 && (man & (3 * round_bit - 1)) != 0 { + // Round it + f16(((half_sign | half_exp | half_man) + 1) as u16) + } else { + f16((half_sign | half_exp | half_man) as u16) + } + } +} + +impl std::fmt::Debug for f16 { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{:?}", self.to_f32()) + } +} + +impl std::fmt::Display for f16 { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{}", self.to_f32()) + } +} + +impl NativeType for f16 { + const PRIMITIVE: PrimitiveType = PrimitiveType::Float16; + type Bytes = [u8; 2]; + #[inline] + fn to_le_bytes(&self) -> Self::Bytes { + self.0.to_le_bytes() + } + + #[inline] + fn to_be_bytes(&self) -> Self::Bytes { + self.0.to_be_bytes() + } + + #[inline] + fn from_be_bytes(bytes: Self::Bytes) -> Self { + Self(u16::from_be_bytes(bytes)) + } + + #[inline] + fn from_le_bytes(bytes: Self::Bytes) -> Self { + Self(u16::from_le_bytes(bytes)) + } +} + +/// Physical representation of a decimal +#[derive(Clone, Copy, Default, Eq, Hash, PartialEq, PartialOrd, Ord)] +#[allow(non_camel_case_types)] +#[repr(C)] +pub struct i256(pub ethnum::I256); + +impl i256 { + /// Returns a new [`i256`] from two `i128`. + pub fn from_words(hi: i128, lo: i128) -> Self { + Self(ethnum::I256::from_words(hi, lo)) + } +} + +impl Neg for i256 { + type Output = Self; + + #[inline] + fn neg(self) -> Self::Output { + let (a, b) = self.0.into_words(); + Self(ethnum::I256::from_words(-a, b)) + } +} + +impl std::fmt::Debug for i256 { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{:?}", self.0) + } +} + +impl std::fmt::Display for i256 { + fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + write!(f, "{}", self.0) + } +} + +unsafe impl Pod for i256 {} +unsafe impl Zeroable for i256 {} + +impl NativeType for i256 { + const PRIMITIVE: PrimitiveType = PrimitiveType::Int256; + + type Bytes = [u8; 32]; + + #[inline] + fn to_le_bytes(&self) -> Self::Bytes { + let mut bytes = [0u8; 32]; + let (a, b) = self.0.into_words(); + let a = a.to_le_bytes(); + (0..16).for_each(|i| { + bytes[i] = a[i]; + }); + + let b = b.to_le_bytes(); + (0..16).for_each(|i| { + bytes[i + 16] = b[i]; + }); + + bytes + } + + #[inline] + fn to_be_bytes(&self) -> Self::Bytes { + let mut bytes = [0u8; 32]; + let (a, b) = self.0.into_words(); + + let a = a.to_be_bytes(); + (0..16).for_each(|i| { + bytes[i] = a[i]; + }); + + let b = b.to_be_bytes(); + (0..16).for_each(|i| { + bytes[i + 16] = b[i]; + }); + + bytes + } + + #[inline] + fn from_be_bytes(bytes: Self::Bytes) -> Self { + let (a, b) = bytes.split_at(16); + let a: [u8; 16] = a.try_into().unwrap(); + let b: [u8; 16] = b.try_into().unwrap(); + let a = i128::from_be_bytes(a); + let b = i128::from_be_bytes(b); + Self(ethnum::I256::from_words(a, b)) + } + + #[inline] + fn from_le_bytes(bytes: Self::Bytes) -> Self { + let (b, a) = bytes.split_at(16); + let a: [u8; 16] = a.try_into().unwrap(); + let b: [u8; 16] = b.try_into().unwrap(); + let a = i128::from_le_bytes(a); + let b = i128::from_le_bytes(b); + Self(ethnum::I256::from_words(a, b)) + } +} + +#[cfg(test)] +mod test { + use super::*; + #[test] + fn test_f16_to_f32() { + let f = f16::from_f32(7.0); + assert_eq!(f.to_f32(), 7.0f32); + + // 7.1 is NOT exactly representable in 16-bit, it's rounded + let f = f16::from_f32(7.1); + let diff = (f.to_f32() - 7.1f32).abs(); + // diff must be <= 4 * EPSILON, as 7 has two more significant 
bits than 1 + assert!(diff <= 4.0 * f16::EPSILON.to_f32()); + + assert_eq!(f16(0x0000_0001).to_f32(), 2.0f32.powi(-24)); + assert_eq!(f16(0x0000_0005).to_f32(), 5.0 * 2.0f32.powi(-24)); + + assert_eq!(f16(0x0000_0001), f16::from_f32(2.0f32.powi(-24))); + assert_eq!(f16(0x0000_0005), f16::from_f32(5.0 * 2.0f32.powi(-24))); + + assert_eq!(format!("{}", f16::from_f32(7.0)), "7".to_string()); + assert_eq!(format!("{:?}", f16::from_f32(7.0)), "7.0".to_string()); + } +} diff --git a/crates/nano-arrow/src/types/offset.rs b/crates/nano-arrow/src/types/offset.rs new file mode 100644 index 000000000000..e68bb7ceb6bd --- /dev/null +++ b/crates/nano-arrow/src/types/offset.rs @@ -0,0 +1,16 @@ +use super::Index; + +/// Sealed trait describing the subset (`i32` and `i64`) of [`Index`] that can be used +/// as offsets of variable-length Arrow arrays. +pub trait Offset: super::private::Sealed + Index { + /// Whether it is `i32` (false) or `i64` (true). + const IS_LARGE: bool; +} + +impl Offset for i32 { + const IS_LARGE: bool = false; +} + +impl Offset for i64 { + const IS_LARGE: bool = true; +} diff --git a/crates/nano-arrow/src/types/simd/mod.rs b/crates/nano-arrow/src/types/simd/mod.rs new file mode 100644 index 000000000000..d906c9d25e95 --- /dev/null +++ b/crates/nano-arrow/src/types/simd/mod.rs @@ -0,0 +1,167 @@ +//! Contains traits and implementations of multi-data used in SIMD. +//! The actual representation is driven by the feature flag `"simd"`, which, if set, +//! uses [`std::simd`]. +use super::{days_ms, f16, i256, months_days_ns, BitChunk, BitChunkIter, NativeType}; + +/// Describes the ability to convert itself from a [`BitChunk`]. +pub trait FromMaskChunk { + /// Convert itself from a slice. + fn from_chunk(v: T) -> Self; +} + +/// A struct that lends itself well to be compiled leveraging SIMD +/// # Safety +/// The `NativeType` and the `NativeSimd` must have possible a matching alignment. +/// e.g. slicing `&[NativeType]` by `align_of()` must be properly aligned/safe. +pub unsafe trait NativeSimd: Sized + Default + Copy { + /// Number of lanes + const LANES: usize; + /// The [`NativeType`] of this struct. E.g. `f32` for a `NativeSimd = f32x16`. + type Native: NativeType; + /// The type holding bits for masks. + type Chunk: BitChunk; + /// Type used for masking. + type Mask: FromMaskChunk; + + /// Sets values to `default` based on `mask`. + fn select(self, mask: Self::Mask, default: Self) -> Self; + + /// Convert itself from a slice. + /// # Panics + /// * iff `v.len()` != `T::LANES` + fn from_chunk(v: &[Self::Native]) -> Self; + + /// creates a new Self from `v` by populating items from `v` up to its length. + /// Items from `v` at positions larger than the number of lanes are ignored; + /// remaining items are populated with `remaining`. + fn from_incomplete_chunk(v: &[Self::Native], remaining: Self::Native) -> Self; + + /// Returns a tuple of 3 items whose middle item is itself, and the remaining + /// are the head and tail of the un-aligned parts. + fn align(values: &[Self::Native]) -> (&[Self::Native], &[Self], &[Self::Native]); +} + +/// Trait implemented by some [`NativeType`] that have a SIMD representation. +pub trait Simd: NativeType { + /// The SIMD type associated with this trait. + /// This type supports SIMD operations + type Simd: NativeSimd; +} + +#[cfg(not(feature = "simd"))] +mod native; +#[cfg(not(feature = "simd"))] +pub use native::*; +#[cfg(feature = "simd")] +mod packed; +#[cfg(feature = "simd")] +pub use packed::*; + +macro_rules! 
native_simd { + ($name:tt, $type:ty, $lanes:expr, $mask:ty) => { + /// Multi-Data correspondence of the native type + #[allow(non_camel_case_types)] + #[derive(Copy, Clone)] + pub struct $name(pub [$type; $lanes]); + + unsafe impl NativeSimd for $name { + const LANES: usize = $lanes; + type Native = $type; + type Chunk = $mask; + type Mask = $mask; + + #[inline] + fn select(self, mask: $mask, default: Self) -> Self { + let mut reduced = default; + let iter = BitChunkIter::new(mask, Self::LANES); + for (i, b) in (0..Self::LANES).zip(iter) { + reduced[i] = if b { self[i] } else { reduced[i] }; + } + reduced + } + + #[inline] + fn from_chunk(v: &[$type]) -> Self { + ($name)(v.try_into().unwrap()) + } + + #[inline] + fn from_incomplete_chunk(v: &[$type], remaining: $type) -> Self { + let mut a = [remaining; $lanes]; + a.iter_mut().zip(v.iter()).for_each(|(a, b)| *a = *b); + Self(a) + } + + #[inline] + fn align(values: &[Self::Native]) -> (&[Self::Native], &[Self], &[Self::Native]) { + unsafe { values.align_to::() } + } + } + + impl std::ops::Index for $name { + type Output = $type; + + #[inline] + fn index(&self, index: usize) -> &Self::Output { + &self.0[index] + } + } + + impl std::ops::IndexMut for $name { + #[inline] + fn index_mut(&mut self, index: usize) -> &mut Self::Output { + &mut self.0[index] + } + } + + impl Default for $name { + #[inline] + fn default() -> Self { + ($name)([<$type>::default(); $lanes]) + } + } + }; +} + +pub(super) use native_simd; + +// Types do not have specific intrinsics and thus SIMD can't be specialized. +// Therefore, we can declare their MD representation as `[$t; 8]` irrespectively +// of how they are represented in the different channels. +native_simd!(f16x32, f16, 32, u32); +native_simd!(days_msx8, days_ms, 8, u8); +native_simd!(months_days_nsx8, months_days_ns, 8, u8); +native_simd!(i128x8, i128, 8, u8); +native_simd!(i256x8, i256, 8, u8); + +// In the native implementation, a mask is 1 bit wide, as per AVX512. +impl FromMaskChunk for T { + #[inline] + fn from_chunk(v: T) -> Self { + v + } +} + +macro_rules! 
native { + ($type:ty, $simd:ty) => { + impl Simd for $type { + type Simd = $simd; + } + }; +} + +native!(u8, u8x64); +native!(u16, u16x32); +native!(u32, u32x16); +native!(u64, u64x8); +native!(i8, i8x64); +native!(i16, i16x32); +native!(i32, i32x16); +native!(i64, i64x8); +native!(f16, f16x32); +native!(f32, f32x16); +native!(f64, f64x8); +native!(i128, i128x8); +native!(i256, i256x8); +native!(days_ms, days_msx8); +native!(months_days_ns, months_days_nsx8); diff --git a/crates/nano-arrow/src/types/simd/native.rs b/crates/nano-arrow/src/types/simd/native.rs new file mode 100644 index 000000000000..af31b8b26bc0 --- /dev/null +++ b/crates/nano-arrow/src/types/simd/native.rs @@ -0,0 +1,16 @@ +use std::convert::TryInto; + +use super::*; +use crate::types::BitChunkIter; + +native_simd!(u8x64, u8, 64, u64); +native_simd!(u16x32, u16, 32, u32); +native_simd!(u32x16, u32, 16, u16); +native_simd!(u64x8, u64, 8, u8); +native_simd!(i8x64, i8, 64, u64); +native_simd!(i16x32, i16, 32, u32); +native_simd!(i32x16, i32, 16, u16); +native_simd!(i64x8, i64, 8, u8); +native_simd!(f16x32, f16, 32, u32); +native_simd!(f32x16, f32, 16, u16); +native_simd!(f64x8, f64, 8, u8); diff --git a/crates/nano-arrow/src/types/simd/packed.rs b/crates/nano-arrow/src/types/simd/packed.rs new file mode 100644 index 000000000000..0d95b68882aa --- /dev/null +++ b/crates/nano-arrow/src/types/simd/packed.rs @@ -0,0 +1,197 @@ +pub use std::simd::{ + f32x16, f32x8, f64x8, i16x32, i16x8, i32x16, i32x8, i64x8, i8x64, i8x8, mask32x16 as m32x16, + mask64x8 as m64x8, mask8x64 as m8x64, u16x32, u16x8, u32x16, u32x8, u64x8, u8x64, u8x8, + SimdPartialEq, +}; + +/// Vector of 32 16-bit masks +#[allow(non_camel_case_types)] +pub type m16x32 = std::simd::Mask; + +use super::*; + +macro_rules! simd { + ($name:tt, $type:ty, $lanes:expr, $chunk:ty, $mask:tt) => { + unsafe impl NativeSimd for $name { + const LANES: usize = $lanes; + type Native = $type; + type Chunk = $chunk; + type Mask = $mask; + + #[inline] + fn select(self, mask: $mask, default: Self) -> Self { + mask.select(self, default) + } + + #[inline] + fn from_chunk(v: &[$type]) -> Self { + <$name>::from_slice(v) + } + + #[inline] + fn from_incomplete_chunk(v: &[$type], remaining: $type) -> Self { + let mut a = [remaining; $lanes]; + a.iter_mut().zip(v.iter()).for_each(|(a, b)| *a = *b); + <$name>::from_chunk(a.as_ref()) + } + + #[inline] + fn align(values: &[Self::Native]) -> (&[Self::Native], &[Self], &[Self::Native]) { + unsafe { values.align_to::() } + } + } + }; +} + +simd!(u8x64, u8, 64, u64, m8x64); +simd!(u16x32, u16, 32, u32, m16x32); +simd!(u32x16, u32, 16, u16, m32x16); +simd!(u64x8, u64, 8, u8, m64x8); +simd!(i8x64, i8, 64, u64, m8x64); +simd!(i16x32, i16, 32, u32, m16x32); +simd!(i32x16, i32, 16, u16, m32x16); +simd!(i64x8, i64, 8, u8, m64x8); +simd!(f32x16, f32, 16, u16, m32x16); +simd!(f64x8, f64, 8, u8, m64x8); + +macro_rules! 
chunk_macro { + ($type:ty, $chunk:ty, $simd:ty, $mask:tt, $m:expr) => { + impl FromMaskChunk<$chunk> for $mask { + #[inline] + fn from_chunk(chunk: $chunk) -> Self { + ($m)(chunk) + } + } + }; +} + +chunk_macro!(u8, u64, u8x64, m8x64, from_chunk_u64); +chunk_macro!(u16, u32, u16x32, m16x32, from_chunk_u32); +chunk_macro!(u32, u16, u32x16, m32x16, from_chunk_u16); +chunk_macro!(u64, u8, u64x8, m64x8, from_chunk_u8); + +#[inline] +fn from_chunk_u8(chunk: u8) -> m64x8 { + let idx = u64x8::from_array([1, 2, 4, 8, 16, 32, 64, 128]); + let vecmask = u64x8::splat(chunk as u64); + + (idx & vecmask).simd_eq(idx) +} + +#[inline] +fn from_chunk_u16(chunk: u16) -> m32x16 { + let idx = u32x16::from_array([ + 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, + ]); + let vecmask = u32x16::splat(chunk as u32); + + (idx & vecmask).simd_eq(idx) +} + +#[inline] +fn from_chunk_u32(chunk: u32) -> m16x32 { + let idx = u16x32::from_array([ + 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, 1, 2, 4, 8, + 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, + ]); + let left = u16x32::from_chunk(&[ + 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + ]); + let right = u16x32::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, 256, 512, + 1024, 2048, 4096, 8192, 16384, 32768, + ]); + + let a = chunk.to_ne_bytes(); + let a1 = u16::from_ne_bytes([a[2], a[3]]); + let a2 = u16::from_ne_bytes([a[0], a[1]]); + + let vecmask1 = u16x32::splat(a1); + let vecmask2 = u16x32::splat(a2); + + (idx & left & vecmask1).simd_eq(idx) | (idx & right & vecmask2).simd_eq(idx) +} + +#[inline] +fn from_chunk_u64(chunk: u64) -> m8x64 { + let idx = u8x64::from_array([ + 1, 2, 4, 8, 16, 32, 64, 128, 1, 2, 4, 8, 16, 32, 64, 128, 1, 2, 4, 8, 16, 32, 64, 128, 1, + 2, 4, 8, 16, 32, 64, 128, 1, 2, 4, 8, 16, 32, 64, 128, 1, 2, 4, 8, 16, 32, 64, 128, 1, 2, + 4, 8, 16, 32, 64, 128, 1, 2, 4, 8, 16, 32, 64, 128, + ]); + let idxs = [ + u8x64::from_chunk(&[ + 1, 2, 4, 8, 16, 32, 64, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, + 32, 64, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, 4, 8, 16, 32, 64, 128, + 0, 0, 0, 0, 0, 0, 0, 0, + ]), + u8x64::from_chunk(&[ + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, + 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 2, + 4, 8, 16, 32, 64, 128, + ]), + ]; + + let a = chunk.to_ne_bytes(); + + let mut result = m8x64::default(); + for i in 0..8 { + result |= (idxs[i] & u8x64::splat(a[i])).simd_eq(idx) + } + + result +} + +#[cfg(test)] +mod tests { + use super::*; + + #[test] + fn test_basic1() { + let a = 0b00000001000000010000000100000001u32; + let a = from_chunk_u32(a); + for i in 0..32 { + assert_eq!(a.test(i), i % 8 == 0) + } + } + + #[test] + fn test_basic2() { + let a = 0b0000000100000001000000010000000100000001000000010000000100000001u64; + let a = from_chunk_u64(a); + for i in 0..64 { + assert_eq!(a.test(i), i % 8 == 0) + } + } +} diff --git a/crates/nano-arrow/src/util/bench_util.rs b/crates/nano-arrow/src/util/bench_util.rs new file mode 100644 index 000000000000..59fb88b198fc --- /dev/null +++ b/crates/nano-arrow/src/util/bench_util.rs @@ -0,0 +1,99 @@ +//! Utilities for benchmarking + +use rand::distributions::{Alphanumeric, Distribution, Standard}; +use rand::rngs::StdRng; +use rand::{Rng, SeedableRng}; + +use crate::array::*; +use crate::offset::Offset; +use crate::types::NativeType; + +/// Returns fixed seedable RNG +pub fn seedable_rng() -> StdRng { + StdRng::seed_from_u64(42) +} + +/// Creates an random (but fixed-seeded) array of a given size and null density +pub fn create_primitive_array(size: usize, null_density: f32) -> PrimitiveArray +where + T: NativeType, + Standard: Distribution, +{ + let mut rng = seedable_rng(); + + (0..size) + .map(|_| { + if rng.gen::() < null_density { + None + } else { + Some(rng.gen()) + } + }) + .collect::>() +} + +/// Creates a new [`PrimitiveArray`] from random values with a pre-set seed. +pub fn create_primitive_array_with_seed( + size: usize, + null_density: f32, + seed: u64, +) -> PrimitiveArray +where + T: NativeType, + Standard: Distribution, +{ + let mut rng = StdRng::seed_from_u64(seed); + + (0..size) + .map(|_| { + if rng.gen::() < null_density { + None + } else { + Some(rng.gen()) + } + }) + .collect::>() +} + +/// Creates an random (but fixed-seeded) array of a given size and null density +pub fn create_boolean_array(size: usize, null_density: f32, true_density: f32) -> BooleanArray +where + Standard: Distribution, +{ + let mut rng = seedable_rng(); + (0..size) + .map(|_| { + if rng.gen::() < null_density { + None + } else { + let value = rng.gen::() < true_density; + Some(value) + } + }) + .collect() +} + +/// Creates an random (but fixed-seeded) [`Utf8Array`] of a given length, number of characters and null density. 
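// A usage sketch for the generators above, assuming the crate's `benchmarks` feature and a
// criterion harness; the kernel being timed (a plain sum over the values, ignoring validity)
// is only illustrative:
//
//     use criterion::Criterion;
//     use nano_arrow::util::bench_util::create_primitive_array;
//
//     fn bench_sum(c: &mut Criterion) {
//         // 2^20 values with 10% nulls, deterministic across runs thanks to the fixed seed.
//         let array = create_primitive_array::<i64>(1 << 20, 0.1);
//         c.bench_function("sum i64 2^20", |b| {
//             b.iter(|| array.values().iter().copied().sum::<i64>())
//         });
//     }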
+pub fn create_string_array<O: Offset>(
+    length: usize,
+    size: usize,
+    null_density: f32,
+    seed: u64,
+) -> Utf8Array<O> {
+    let mut rng = StdRng::seed_from_u64(seed);
+
+    (0..length)
+        .map(|_| {
+            if rng.gen::<f32>() < null_density {
+                None
+            } else {
+                let value = (&mut rng)
+                    .sample_iter(&Alphanumeric)
+                    .take(size)
+                    .map(char::from)
+                    .collect::<String>();
+                Some(value)
+            }
+        })
+        .collect()
+}
diff --git a/crates/nano-arrow/src/util/lexical.rs b/crates/nano-arrow/src/util/lexical.rs
new file mode 100644
index 000000000000..047986cbbedd
--- /dev/null
+++ b/crates/nano-arrow/src/util/lexical.rs
@@ -0,0 +1,42 @@
+/// Converts numeric type to a `String`
+#[inline]
+pub fn lexical_to_bytes<N: lexical_core::ToLexical>(n: N) -> Vec<u8> {
+    let mut buf = Vec::<u8>::with_capacity(N::FORMATTED_SIZE_DECIMAL);
+    lexical_to_bytes_mut(n, &mut buf);
+    buf
+}
+
+/// Converts numeric type to a `String`
+#[inline]
+pub fn lexical_to_bytes_mut<N: lexical_core::ToLexical>(n: N, buf: &mut Vec<u8>) {
+    buf.clear();
+    buf.reserve(N::FORMATTED_SIZE_DECIMAL);
+    unsafe {
+        // JUSTIFICATION
+        //  Benefit
+        //      Allows using the faster serializer lexical core and convert to string
+        //  Soundness
+        //      Length of buf is set as written length afterwards. lexical_core
+        //      creates a valid string, so doesn't need to be checked.
+        let slice = std::slice::from_raw_parts_mut(buf.as_mut_ptr(), buf.capacity());
+
+        // Safety:
+        // Omits an unneeded bound check as we just ensured that we reserved `N::FORMATTED_SIZE_DECIMAL`
+        #[cfg(debug_assertions)]
+        {
+            let len = lexical_core::write(n, slice).len();
+            buf.set_len(len);
+        }
+        #[cfg(not(debug_assertions))]
+        {
+            let len = lexical_core::write_unchecked(n, slice).len();
+            buf.set_len(len);
+        }
+    }
+}
+
+/// Converts numeric type to a `String`
+#[inline]
+pub fn lexical_to_string<N: lexical_core::ToLexical>(n: N) -> String {
+    unsafe { String::from_utf8_unchecked(lexical_to_bytes(n)) }
+}
diff --git a/crates/nano-arrow/src/util/mod.rs b/crates/nano-arrow/src/util/mod.rs
new file mode 100644
index 000000000000..90642b151a1a
--- /dev/null
+++ b/crates/nano-arrow/src/util/mod.rs
@@ -0,0 +1,24 @@
+//! Misc utilities used in different places in the crate.
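// A minimal usage sketch of the helpers re-exported from this module, assuming one of
// the features that enable `lexical` (e.g. `compute`) is active; the scratch-buffer
// pattern below is what per-value serializers rely on to avoid repeated allocations.
#[cfg(all(test, feature = "compute"))]
mod lexical_usage {
    use super::{lexical_to_bytes_mut, lexical_to_string};

    #[test]
    fn reuse_scratch_buffer() {
        assert_eq!(lexical_to_string(42i32), "42");

        // Format several values into one output buffer, reusing a single scratch allocation.
        let mut scratch = Vec::new();
        let mut out = Vec::new();
        for (i, v) in [1u32, 22, 333].iter().enumerate() {
            if i != 0 {
                out.push(b',');
            }
            lexical_to_bytes_mut(*v, &mut scratch);
            out.extend_from_slice(&scratch);
        }
        assert_eq!(out, b"1,22,333".to_vec());
    }
}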
+ +#[cfg(any( + feature = "compute", + feature = "io_csv_write", + feature = "io_csv_read", + feature = "io_json", + feature = "io_json_write", + feature = "compute_cast" +))] +mod lexical; +#[cfg(any( + feature = "compute", + feature = "io_csv_write", + feature = "io_csv_read", + feature = "io_json", + feature = "io_json_write", + feature = "compute_cast" +))] +pub use lexical::*; + +#[cfg(feature = "benchmarks")] +#[cfg_attr(docsrs, doc(cfg(feature = "benchmarks")))] +pub mod bench_util; diff --git a/crates/polars-arrow/Cargo.toml b/crates/polars-arrow/Cargo.toml index 233987f78120..ac44783ddd46 100644 --- a/crates/polars-arrow/Cargo.toml +++ b/crates/polars-arrow/Cargo.toml @@ -34,6 +34,5 @@ compute = ["arrow/compute_cast"] temporal = ["arrow/compute_temporal"] bigidx = [] performant = [] -like = ["arrow/compute_like"] timezones = ["chrono-tz", "chrono"] simd = [] diff --git a/crates/polars-core/Cargo.toml b/crates/polars-core/Cargo.toml index 174e3cfc0a9a..eb6c691a302f 100644 --- a/crates/polars-core/Cargo.toml +++ b/crates/polars-core/Cargo.toml @@ -64,7 +64,7 @@ lazy = [] performant = ["polars-arrow/performant", "reinterpret"] # extra utilities for Utf8Chunked -strings = ["regex", "polars-arrow/strings", "arrow/compute_substring", "polars-error/regex"] +strings = ["regex", "polars-arrow/strings", "polars-error/regex"] # support for ObjectChunked (downcastable Series of any type) object = ["serde_json"] diff --git a/crates/polars-io/Cargo.toml b/crates/polars-io/Cargo.toml index fb6f54cd1695..950abb8a225b 100644 --- a/crates/polars-io/Cargo.toml +++ b/crates/polars-io/Cargo.toml @@ -37,7 +37,7 @@ regex = { workspace = true } serde = { workspace = true, features = ["derive"], optional = true } serde_json = { version = "1", default-features = false, features = ["alloc", "raw_value"], optional = true } simd-json = { workspace = true, optional = true } -simdutf8 = { version = "0.1", optional = true } +simdutf8 = { workspace = true, optional = true } tokio = { version = "1.26", features = ["net"], optional = true } tokio-util = { version = "0.7.8", features = ["io", "io-util"], optional = true } url = { workspace = true, optional = true } @@ -52,7 +52,6 @@ tempdir = "0.3.7" default = ["decompress"] # support for arrows json parsing json = [ - "arrow/io_json_write", "polars-json", "simd-json", "lexical", diff --git a/crates/polars-io/src/json/mod.rs b/crates/polars-io/src/json/mod.rs index c5c7d8fe503f..f64709a52a19 100644 --- a/crates/polars-io/src/json/mod.rs +++ b/crates/polars-io/src/json/mod.rs @@ -67,7 +67,6 @@ use std::ops::Deref; use arrow::array::StructArray; pub use arrow::error::Result as ArrowResult; -pub use arrow::io::json; use polars_arrow::conversion::chunk_to_struct; use polars_arrow::utils::CustomIterTools; use polars_core::error::to_compute_err; @@ -141,13 +140,14 @@ where match self.json_format { JsonFormat::JsonLines => { - let serializer = arrow_ndjson::write::Serializer::new(batches, vec![]); - let writer = arrow_ndjson::write::FileWriter::new(&mut self.buffer, serializer); + let serializer = polars_json::ndjson::write::Serializer::new(batches, vec![]); + let writer = + polars_json::ndjson::write::FileWriter::new(&mut self.buffer, serializer); writer.collect::>()?; }, JsonFormat::Json => { - let serializer = json::write::Serializer::new(batches, vec![]); - json::write::write(&mut self.buffer, serializer)?; + let serializer = polars_json::json::write::Serializer::new(batches, vec![]); + polars_json::json::write::write(&mut self.buffer, serializer)?; }, } diff --git 
a/crates/polars-io/src/ndjson/core.rs b/crates/polars-io/src/ndjson/core.rs
index 67edf90558f0..dda5108d2f9c 100644
--- a/crates/polars-io/src/ndjson/core.rs
+++ b/crates/polars-io/src/ndjson/core.rs
@@ -3,7 +3,6 @@
 use std::io::Cursor;
 use std::path::PathBuf;
 pub use arrow::array::StructArray;
-pub use arrow::io::ndjson as arrow_ndjson;
 use num_traits::pow::Pow;
 use polars_core::prelude::*;
 use polars_core::utils::accumulate_dataframes_vertical;
diff --git a/crates/polars-json/Cargo.toml b/crates/polars-json/Cargo.toml
index 49018673e71e..cf86ac23e607 100644
--- a/crates/polars-json/Cargo.toml
+++ b/crates/polars-json/Cargo.toml
@@ -15,8 +15,11 @@
 polars-utils = { workspace = true }
 ahash = { workspace = true }
 arrow = { workspace = true }
+chrono = { workspace = true }
 fallible-streaming-iterator = { version = "0.1" }
 hashbrown = { workspace = true }
 indexmap = { workspace = true }
+lexical-core = { version = "0.8" }
 num-traits = { workspace = true }
 simd-json = { workspace = true }
+streaming-iterator = { workspace = true }
diff --git a/crates/polars-json/src/json/mod.rs b/crates/polars-json/src/json/mod.rs
index 1ab9c2dd15ce..d39d7513c431 100644
--- a/crates/polars-json/src/json/mod.rs
+++ b/crates/polars-json/src/json/mod.rs
@@ -5,3 +5,4 @@ pub use deserialize::deserialize;
 pub use infer_schema::{infer, infer_records_schema};
 use polars_error::*;
 use polars_utils::aliases::*;
+pub mod write;
diff --git a/crates/polars-json/src/json/write/mod.rs b/crates/polars-json/src/json/write/mod.rs
new file mode 100644
index 000000000000..343bae73e520
--- /dev/null
+++ b/crates/polars-json/src/json/write/mod.rs
@@ -0,0 +1,157 @@
+//! APIs to write to JSON
+mod serialize;
+mod utf8;
+
+use std::io::Write;
+
+use arrow::array::Array;
+use arrow::chunk::Chunk;
+use arrow::datatypes::Schema;
+use arrow::error::Error;
+use arrow::io::iterator::StreamingIterator;
+pub use fallible_streaming_iterator::*;
+pub(crate) use serialize::new_serializer;
+use serialize::serialize;
+
+/// [`FallibleStreamingIterator`] that serializes an [`Array`] to bytes of valid JSON
+/// # Implementation
+/// Advancing this iterator is CPU-bounded
+#[derive(Debug, Clone)]
+pub struct Serializer<A, I>
+where
+    A: AsRef<dyn Array>,
+    I: Iterator<Item = Result<A, Error>>,
+{
+    arrays: I,
+    buffer: Vec<u8>,
+}
+
+impl<A, I> Serializer<A, I>
+where
+    A: AsRef<dyn Array>,
+    I: Iterator<Item = Result<A, Error>>,
+{
+    /// Creates a new [`Serializer`].
+    pub fn new(arrays: I, buffer: Vec<u8>) -> Self {
+        Self { arrays, buffer }
+    }
+}
+
+impl<A, I> FallibleStreamingIterator for Serializer<A, I>
+where
+    A: AsRef<dyn Array>,
+    I: Iterator<Item = Result<A, Error>>,
+{
+    type Item = [u8];
+
+    type Error = Error;
+
+    fn advance(&mut self) -> Result<(), Error> {
+        self.buffer.clear();
+        self.arrays
+            .next()
+            .map(|maybe_array| maybe_array.map(|array| serialize(array.as_ref(), &mut self.buffer)))
+            .transpose()?;
+        Ok(())
+    }
+
+    fn get(&self) -> Option<&Self::Item> {
+        if !self.buffer.is_empty() {
+            Some(&self.buffer)
+        } else {
+            None
+        }
+    }
+}
+
+/// [`FallibleStreamingIterator`] that serializes a [`Chunk`] into bytes of JSON
+/// in a (pandas-compatible) record-oriented format.
+///
+/// # Implementation
+/// Advancing this iterator is CPU-bounded.
+pub struct RecordSerializer<'a> {
+    schema: Schema,
+    index: usize,
+    end: usize,
+    iterators: Vec<Box<dyn StreamingIterator<Item = [u8]> + Send + Sync + 'a>>,
+    buffer: Vec<u8>,
+}
+
+impl<'a> RecordSerializer<'a> {
+    /// Creates a new [`RecordSerializer`].
+ pub fn new(schema: Schema, chunk: &'a Chunk, buffer: Vec) -> Self + where + A: AsRef, + { + let end = chunk.len(); + let iterators = chunk + .arrays() + .iter() + .map(|arr| new_serializer(arr.as_ref(), 0, usize::MAX)) + .collect(); + + Self { + schema, + index: 0, + end, + iterators, + buffer, + } + } +} + +impl<'a> FallibleStreamingIterator for RecordSerializer<'a> { + type Item = [u8]; + + type Error = Error; + + fn advance(&mut self) -> Result<(), Error> { + self.buffer.clear(); + if self.index == self.end { + return Ok(()); + } + + let mut is_first_row = true; + write!(&mut self.buffer, "{{")?; + for (f, ref mut it) in self.schema.fields.iter().zip(self.iterators.iter_mut()) { + if !is_first_row { + write!(&mut self.buffer, ",")?; + } + write!(&mut self.buffer, "\"{}\":", f.name)?; + + self.buffer.extend_from_slice(it.next().unwrap()); + is_first_row = false; + } + write!(&mut self.buffer, "}}")?; + + self.index += 1; + Ok(()) + } + + fn get(&self) -> Option<&Self::Item> { + if !self.buffer.is_empty() { + Some(&self.buffer) + } else { + None + } + } +} + +/// Writes valid JSON from an iterator of (assumed JSON-encoded) bytes to `writer` +pub fn write(writer: &mut W, mut blocks: I) -> Result<(), Error> +where + W: std::io::Write, + I: FallibleStreamingIterator, +{ + writer.write_all(&[b'['])?; + let mut is_first_row = true; + while let Some(block) = blocks.next()? { + if !is_first_row { + writer.write_all(&[b','])?; + } + is_first_row = false; + writer.write_all(block)?; + } + writer.write_all(&[b']'])?; + Ok(()) +} diff --git a/crates/polars-json/src/json/write/serialize.rs b/crates/polars-json/src/json/write/serialize.rs new file mode 100644 index 000000000000..89453fe144c4 --- /dev/null +++ b/crates/polars-json/src/json/write/serialize.rs @@ -0,0 +1,512 @@ +use std::io::Write; + +use arrow::array::*; +use arrow::bitmap::utils::ZipValidity; +use arrow::datatypes::{DataType, IntegerType, TimeUnit}; +use arrow::io::iterator::BufStreamingIterator; +use arrow::offset::Offset; +#[cfg(feature = "chrono-tz")] +use arrow::temporal_conversions::parse_offset_tz; +use arrow::temporal_conversions::{ + date32_to_date, date64_to_date, duration_ms_to_duration, duration_ns_to_duration, + duration_s_to_duration, duration_us_to_duration, parse_offset, timestamp_ms_to_datetime, + timestamp_ns_to_datetime, timestamp_s_to_datetime, timestamp_to_datetime, + timestamp_us_to_datetime, +}; +use arrow::types::NativeType; +use arrow::util::lexical_to_bytes_mut; +use chrono::{Duration, NaiveDate, NaiveDateTime}; +use lexical_core::ToLexical; +use streaming_iterator::StreamingIterator; + +use super::utf8; + +fn materialize_serializer<'a, I, F, T>( + f: F, + iterator: I, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> +where + T: 'a, + I: Iterator + Send + Sync + 'a, + F: FnMut(T, &mut Vec) + Send + Sync + 'a, +{ + if offset > 0 || take < usize::MAX { + Box::new(BufStreamingIterator::new( + iterator.skip(offset).take(take), + f, + vec![], + )) + } else { + Box::new(BufStreamingIterator::new(iterator, f, vec![])) + } +} + +fn boolean_serializer<'a>( + array: &'a BooleanArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + let f = |x: Option, buf: &mut Vec| match x { + Some(true) => buf.extend_from_slice(b"true"), + Some(false) => buf.extend_from_slice(b"false"), + None => buf.extend_from_slice(b"null"), + }; + materialize_serializer(f, array.iter(), offset, take) +} + +fn null_serializer( + len: usize, + offset: usize, + take: usize, +) -> Box + Send + Sync> { + let f = |_x: (), 
buf: &mut Vec| buf.extend_from_slice(b"null"); + materialize_serializer(f, std::iter::repeat(()).take(len), offset, take) +} + +fn primitive_serializer<'a, T: NativeType + ToLexical>( + array: &'a PrimitiveArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + let f = |x: Option<&T>, buf: &mut Vec| { + if let Some(x) = x { + lexical_to_bytes_mut(*x, buf) + } else { + buf.extend(b"null") + } + }; + materialize_serializer(f, array.iter(), offset, take) +} + +fn float_serializer<'a, T>( + array: &'a PrimitiveArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> +where + T: num_traits::Float + NativeType + ToLexical, +{ + let f = |x: Option<&T>, buf: &mut Vec| { + if let Some(x) = x { + if T::is_nan(*x) || T::is_infinite(*x) { + buf.extend(b"null") + } else { + lexical_to_bytes_mut(*x, buf) + } + } else { + buf.extend(b"null") + } + }; + + materialize_serializer(f, array.iter(), offset, take) +} + +fn dictionary_utf8_serializer<'a, K: DictionaryKey, O: Offset>( + array: &'a DictionaryArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + let iter = array.iter_typed::>().unwrap().skip(offset); + let f = |x: Option<&str>, buf: &mut Vec| { + if let Some(x) = x { + utf8::write_str(buf, x).unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + materialize_serializer(f, iter, offset, take) +} + +fn utf8_serializer<'a, O: Offset>( + array: &'a Utf8Array, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + let f = |x: Option<&str>, buf: &mut Vec| { + if let Some(x) = x { + utf8::write_str(buf, x).unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + materialize_serializer(f, array.iter(), offset, take) +} + +fn struct_serializer<'a>( + array: &'a StructArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + // {"a": [1, 2, 3], "b": [a, b, c], "c": {"a": [1, 2, 3]}} + // [ + // {"a": 1, "b": a, "c": {"a": 1}}, + // {"a": 2, "b": b, "c": {"a": 2}}, + // {"a": 3, "b": c, "c": {"a": 3}}, + // ] + // + let mut serializers = array + .values() + .iter() + .map(|x| x.as_ref()) + .map(|arr| new_serializer(arr, offset, take)) + .collect::>(); + let names = array.fields().iter().map(|f| f.name.as_str()); + + Box::new(BufStreamingIterator::new( + ZipValidity::new_with_validity(0..array.len(), array.validity()), + move |maybe, buf| { + if maybe.is_some() { + let names = names.clone(); + let mut record: Vec<(&str, &[u8])> = Default::default(); + serializers + .iter_mut() + .zip(names) + // `unwrap` is infalible because `array.len()` equals `len` on `Chunk` + .for_each(|(iter, name)| { + let item = iter.next().unwrap(); + record.push((name, item)); + }); + serialize_item(buf, &record, true); + } else { + serializers.iter_mut().for_each(|iter| { + let _ = iter.next(); + }); + buf.extend(b"null"); + } + }, + vec![], + )) +} + +fn list_serializer<'a, O: Offset>( + array: &'a ListArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + // [[1, 2], [3]] + // [ + // [1, 2], + // [3] + // ] + // + let offsets = array.offsets().as_slice(); + let start = offsets[0].to_usize(); + let end = offsets.last().unwrap().to_usize(); + let mut serializer = new_serializer(array.values().as_ref(), start, end - start); + + let f = move |offset: Option<&[O]>, buf: &mut Vec| { + if let Some(offset) = offset { + let length = (offset[1] - offset[0]).to_usize(); + buf.push(b'['); + let mut is_first_row = true; + for _ in 0..length { + if !is_first_row { + buf.push(b','); + } + is_first_row = false; + 
buf.extend(serializer.next().unwrap()); + } + buf.push(b']'); + } else { + buf.extend(b"null"); + } + }; + + let iter = + ZipValidity::new_with_validity(array.offsets().buffer().windows(2), array.validity()); + materialize_serializer(f, iter, offset, take) +} + +fn fixed_size_list_serializer<'a>( + array: &'a FixedSizeListArray, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + let mut serializer = new_serializer(array.values().as_ref(), offset, take); + + Box::new(BufStreamingIterator::new( + ZipValidity::new(0..array.len(), array.validity().map(|x| x.iter())), + move |ix, buf| { + if ix.is_some() { + let length = array.size(); + buf.push(b'['); + let mut is_first_row = true; + for _ in 0..length { + if !is_first_row { + buf.push(b','); + } + is_first_row = false; + buf.extend(serializer.next().unwrap()); + } + buf.push(b']'); + } else { + buf.extend(b"null"); + } + }, + vec![], + )) +} + +fn date_serializer<'a, T, F>( + array: &'a PrimitiveArray, + convert: F, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> +where + T: NativeType, + F: Fn(T) -> NaiveDate + 'static + Send + Sync, +{ + let f = move |x: Option<&T>, buf: &mut Vec| { + if let Some(x) = x { + let nd = convert(*x); + write!(buf, "\"{nd}\"").unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + + materialize_serializer(f, array.iter(), offset, take) +} + +fn duration_serializer<'a, T, F>( + array: &'a PrimitiveArray, + convert: F, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> +where + T: NativeType, + F: Fn(T) -> Duration + 'static + Send + Sync, +{ + let f = move |x: Option<&T>, buf: &mut Vec| { + if let Some(x) = x { + let duration = convert(*x); + write!(buf, "\"{duration}\"").unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + + materialize_serializer(f, array.iter(), offset, take) +} + +fn timestamp_serializer<'a, F>( + array: &'a PrimitiveArray, + convert: F, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> +where + F: Fn(i64) -> NaiveDateTime + 'static + Send + Sync, +{ + let f = move |x: Option<&i64>, buf: &mut Vec| { + if let Some(x) = x { + let ndt = convert(*x); + write!(buf, "\"{ndt}\"").unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + materialize_serializer(f, array.iter(), offset, take) +} + +fn timestamp_tz_serializer<'a>( + array: &'a PrimitiveArray, + time_unit: TimeUnit, + tz: &str, + offset: usize, + take: usize, +) -> Box + 'a + Send + Sync> { + match parse_offset(tz) { + Ok(parsed_tz) => { + let f = move |x: Option<&i64>, buf: &mut Vec| { + if let Some(x) = x { + let dt_str = timestamp_to_datetime(*x, time_unit, &parsed_tz).to_rfc3339(); + write!(buf, "\"{dt_str}\"").unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + + materialize_serializer(f, array.iter(), offset, take) + }, + #[cfg(feature = "chrono-tz")] + _ => match parse_offset_tz(tz) { + Ok(parsed_tz) => { + let f = move |x: Option<&i64>, buf: &mut Vec| { + if let Some(x) = x { + let dt_str = timestamp_to_datetime(*x, time_unit, &parsed_tz).to_rfc3339(); + write!(buf, "\"{dt_str}\"").unwrap(); + } else { + buf.extend_from_slice(b"null") + } + }; + + materialize_serializer(f, array.iter(), offset, take) + }, + _ => { + panic!("Timezone {} is invalid or not supported", tz); + }, + }, + #[cfg(not(feature = "chrono-tz"))] + _ => { + panic!("Invalid Offset format (must be [-]00:00) or chrono-tz feature not active"); + }, + } +} + +pub(crate) fn new_serializer<'a>( + array: &'a dyn Array, + offset: usize, + take: usize, +) -> Box + 'a + Send + 
Sync> { + match array.data_type().to_logical_type() { + DataType::Boolean => { + boolean_serializer(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Int8 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Int16 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Int32 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Int64 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::UInt8 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::UInt16 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::UInt32 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::UInt64 => { + primitive_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Float32 => { + float_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Float64 => { + float_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Utf8 => { + utf8_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::LargeUtf8 => { + utf8_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::Struct(_) => { + struct_serializer(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::FixedSizeList(_, _) => { + fixed_size_list_serializer(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::List(_) => { + list_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + DataType::LargeList(_) => { + list_serializer::(array.as_any().downcast_ref().unwrap(), offset, take) + }, + other @ DataType::Dictionary(k, v, _) => match (k, &**v) { + (IntegerType::UInt32, DataType::LargeUtf8) => { + let array = array + .as_any() + .downcast_ref::>() + .unwrap(); + dictionary_utf8_serializer::(array, offset, take) + }, + _ => { + todo!("Writing {:?} to JSON", other) + }, + }, + DataType::Date32 => date_serializer( + array.as_any().downcast_ref().unwrap(), + date32_to_date, + offset, + take, + ), + DataType::Date64 => date_serializer( + array.as_any().downcast_ref().unwrap(), + date64_to_date, + offset, + take, + ), + DataType::Timestamp(tu, None) => { + let convert = match tu { + TimeUnit::Nanosecond => timestamp_ns_to_datetime, + TimeUnit::Microsecond => timestamp_us_to_datetime, + TimeUnit::Millisecond => timestamp_ms_to_datetime, + TimeUnit::Second => timestamp_s_to_datetime, + }; + timestamp_serializer( + array.as_any().downcast_ref().unwrap(), + convert, + offset, + take, + ) + }, + DataType::Timestamp(time_unit, Some(tz)) => timestamp_tz_serializer( + array.as_any().downcast_ref().unwrap(), + *time_unit, + tz, + offset, + take, + ), + DataType::Duration(tu) => { + let convert = match tu { + TimeUnit::Nanosecond => duration_ns_to_duration, + TimeUnit::Microsecond => duration_us_to_duration, + TimeUnit::Millisecond => duration_ms_to_duration, + TimeUnit::Second => duration_s_to_duration, + }; + duration_serializer( + array.as_any().downcast_ref().unwrap(), + convert, + offset, + take, + ) + }, + DataType::Null => null_serializer(array.len(), offset, take), + other => todo!("Writing {:?} to JSON", other), + } +} + +fn serialize_item(buffer: &mut Vec, record: &[(&str, &[u8])], is_first_row: bool) { + if !is_first_row { + 
buffer.push(b','); + } + buffer.push(b'{'); + let mut first_item = true; + for (key, value) in record { + if !first_item { + buffer.push(b','); + } + first_item = false; + utf8::write_str(buffer, key).unwrap(); + buffer.push(b':'); + buffer.extend(*value); + } + buffer.push(b'}'); +} + +/// Serializes `array` to a valid JSON to `buffer` +/// # Implementation +/// This operation is CPU-bounded +pub(crate) fn serialize(array: &dyn Array, buffer: &mut Vec) { + let mut serializer = new_serializer(array, 0, usize::MAX); + + (0..array.len()).for_each(|i| { + if i != 0 { + buffer.push(b','); + } + buffer.extend_from_slice(serializer.next().unwrap()); + }); +} diff --git a/crates/polars-json/src/json/write/utf8.rs b/crates/polars-json/src/json/write/utf8.rs new file mode 100644 index 000000000000..941d73379c3d --- /dev/null +++ b/crates/polars-json/src/json/write/utf8.rs @@ -0,0 +1,138 @@ +// Adapted from https://github.com/serde-rs/json/blob/f901012df66811354cb1d490ad59480d8fdf77b5/src/ser.rs +use std::io; + +pub fn write_str(writer: &mut W, value: &str) -> io::Result<()> +where + W: io::Write, +{ + writer.write_all(b"\"")?; + let bytes = value.as_bytes(); + + let mut start = 0; + + for (i, &byte) in bytes.iter().enumerate() { + let escape = ESCAPE[byte as usize]; + if escape == 0 { + continue; + } + + if start < i { + writer.write_all(&bytes[start..i])?; + } + + let char_escape = CharEscape::from_escape_table(escape, byte); + write_char_escape(writer, char_escape)?; + + start = i + 1; + } + + if start != bytes.len() { + writer.write_all(&bytes[start..])?; + } + writer.write_all(b"\"") +} + +const BB: u8 = b'b'; // \x08 +const TT: u8 = b't'; // \x09 +const NN: u8 = b'n'; // \x0A +const FF: u8 = b'f'; // \x0C +const RR: u8 = b'r'; // \x0D +const QU: u8 = b'"'; // \x22 +const BS: u8 = b'\\'; // \x5C +const UU: u8 = b'u'; // \x00...\x1F except the ones above +const __: u8 = 0; + +// Lookup table of escape sequences. A value of b'x' at index i means that byte +// i is escaped as "\x" in JSON. A value of 0 means that byte i is not escaped. +static ESCAPE: [u8; 256] = [ + // 1 2 3 4 5 6 7 8 9 A B C D E F + UU, UU, UU, UU, UU, UU, UU, UU, BB, TT, NN, UU, FF, RR, UU, UU, // 0 + UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, UU, // 1 + __, __, QU, __, __, __, __, __, __, __, __, __, __, __, __, __, // 2 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 3 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 4 + __, __, __, __, __, __, __, __, __, __, __, __, BS, __, __, __, // 5 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 6 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 7 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 8 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // 9 + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // A + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // B + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // C + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // D + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // E + __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, __, // F +]; + +/// Represents a character escape code in a type-safe manner. 
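// For reference, `write_str` above escapes only `"`, `\` and the ASCII control bytes
// (0x00..0x1F); every other byte, including non-ASCII UTF-8, is copied through as-is.
// A small sketch of the expected output, written into an in-memory buffer:
//
//     let mut buf = Vec::new();
//     write_str(&mut buf, "a\"b\\c\nd").unwrap();
//     assert_eq!(std::str::from_utf8(&buf).unwrap(), r#""a\"b\\c\nd""#);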
+pub enum CharEscape { + /// An escaped quote `"` + Quote, + /// An escaped reverse solidus `\` + ReverseSolidus, + // An escaped solidus `/` + //Solidus, + /// An escaped backspace character (usually escaped as `\b`) + Backspace, + /// An escaped form feed character (usually escaped as `\f`) + FormFeed, + /// An escaped line feed character (usually escaped as `\n`) + LineFeed, + /// An escaped carriage return character (usually escaped as `\r`) + CarriageReturn, + /// An escaped tab character (usually escaped as `\t`) + Tab, + /// An escaped ASCII plane control character (usually escaped as + /// `\u00XX` where `XX` are two hex characters) + AsciiControl(u8), +} + +impl CharEscape { + #[inline] + fn from_escape_table(escape: u8, byte: u8) -> CharEscape { + match escape { + self::BB => CharEscape::Backspace, + self::TT => CharEscape::Tab, + self::NN => CharEscape::LineFeed, + self::FF => CharEscape::FormFeed, + self::RR => CharEscape::CarriageReturn, + self::QU => CharEscape::Quote, + self::BS => CharEscape::ReverseSolidus, + self::UU => CharEscape::AsciiControl(byte), + _ => unreachable!(), + } + } +} + +#[inline] +fn write_char_escape(writer: &mut W, char_escape: CharEscape) -> io::Result<()> +where + W: io::Write, +{ + use self::CharEscape::*; + + let s = match char_escape { + Quote => b"\\\"", + ReverseSolidus => b"\\\\", + //Solidus => b"\\/", + Backspace => b"\\b", + FormFeed => b"\\f", + LineFeed => b"\\n", + CarriageReturn => b"\\r", + Tab => b"\\t", + AsciiControl(byte) => { + static HEX_DIGITS: [u8; 16] = *b"0123456789abcdef"; + let bytes = &[ + b'\\', + b'u', + b'0', + b'0', + HEX_DIGITS[(byte >> 4) as usize], + HEX_DIGITS[(byte & 0xF) as usize], + ]; + return writer.write_all(bytes); + }, + }; + + writer.write_all(s) +} diff --git a/crates/polars-json/src/ndjson/mod.rs b/crates/polars-json/src/ndjson/mod.rs index 429b1096b1ae..2076715e711f 100644 --- a/crates/polars-json/src/ndjson/mod.rs +++ b/crates/polars-json/src/ndjson/mod.rs @@ -3,5 +3,6 @@ use polars_arrow::prelude::*; use polars_error::*; pub mod deserialize; mod file; +pub mod write; pub use file::{infer, infer_iter}; diff --git a/crates/polars-json/src/ndjson/write.rs b/crates/polars-json/src/ndjson/write.rs new file mode 100644 index 000000000000..5cbda120711f --- /dev/null +++ b/crates/polars-json/src/ndjson/write.rs @@ -0,0 +1,118 @@ +//! APIs to serialize and write to [NDJSON](http://ndjson.org/). +use std::io::Write; + +use arrow::array::Array; +use arrow::error::Error; +pub use fallible_streaming_iterator::FallibleStreamingIterator; + +use super::super::json::write::new_serializer; + +fn serialize(array: &dyn Array, buffer: &mut Vec) { + let mut serializer = new_serializer(array, 0, usize::MAX); + (0..array.len()).for_each(|_| { + buffer.extend_from_slice(serializer.next().unwrap()); + buffer.push(b'\n'); + }); +} + +/// [`FallibleStreamingIterator`] that serializes an [`Array`] to bytes of valid NDJSON +/// where every line is an element of the array. +/// # Implementation +/// Advancing this iterator CPU-bounded +#[derive(Debug, Clone)] +pub struct Serializer +where + A: AsRef, + I: Iterator>, +{ + arrays: I, + buffer: Vec, +} + +impl Serializer +where + A: AsRef, + I: Iterator>, +{ + /// Creates a new [`Serializer`]. 
+ pub fn new(arrays: I, buffer: Vec) -> Self { + Self { arrays, buffer } + } +} + +impl FallibleStreamingIterator for Serializer +where + A: AsRef, + I: Iterator>, +{ + type Item = [u8]; + + type Error = Error; + + fn advance(&mut self) -> Result<(), Error> { + self.buffer.clear(); + self.arrays + .next() + .map(|maybe_array| maybe_array.map(|array| serialize(array.as_ref(), &mut self.buffer))) + .transpose()?; + Ok(()) + } + + fn get(&self) -> Option<&Self::Item> { + if !self.buffer.is_empty() { + Some(&self.buffer) + } else { + None + } + } +} + +/// An iterator adapter that receives an implementer of [`Write`] and +/// an implementer of [`FallibleStreamingIterator`] (such as [`Serializer`]) +/// and writes a valid NDJSON +/// # Implementation +/// Advancing this iterator mixes CPU-bounded (serializing arrays) tasks and IO-bounded (write to the writer). +pub struct FileWriter +where + W: Write, + I: FallibleStreamingIterator, +{ + writer: W, + iterator: I, +} + +impl FileWriter +where + W: Write, + I: FallibleStreamingIterator, +{ + /// Creates a new [`FileWriter`]. + pub fn new(writer: W, iterator: I) -> Self { + Self { writer, iterator } + } + + /// Returns the inner content of this iterator + /// + /// There are two use-cases for this function: + /// * to continue writing to its writer + /// * to re-use an internal buffer of its iterator + pub fn into_inner(self) -> (W, I) { + (self.writer, self.iterator) + } +} + +impl Iterator for FileWriter +where + W: Write, + I: FallibleStreamingIterator, +{ + type Item = Result<(), Error>; + + fn next(&mut self) -> Option { + let item = self.iterator.next().transpose()?; + Some(item.and_then(|x| { + self.writer.write_all(x)?; + Ok(()) + })) + } +} diff --git a/crates/polars-ops/Cargo.toml b/crates/polars-ops/Cargo.toml index 9f8af54f742e..272cca8e65c7 100644 --- a/crates/polars-ops/Cargo.toml +++ b/crates/polars-ops/Cargo.toml @@ -16,11 +16,11 @@ polars-utils = { workspace = true, default-features = false } argminmax = { version = "0.6.1", default-features = false, features = ["float"] } arrow = { workspace = true } -base64 = { version = "0.21", optional = true } +base64 = { workspace = true, optional = true } chrono = { workspace = true, optional = true } chrono-tz = { workspace = true, optional = true } either = { workspace = true } -hex = { version = "0.4", optional = true } +hex = { workspace = true, optional = true } indexmap = { workspace = true } jsonpath_lib = { version = "0.3", optional = true, git = "https://github.com/ritchie46/jsonpath", branch = "improve_compiled" } memchr = { workspace = true } diff --git a/crates/polars-ops/src/chunked_array/strings/mod.rs b/crates/polars-ops/src/chunked_array/strings/mod.rs index 3caaec8a9dba..caed488b40a9 100644 --- a/crates/polars-ops/src/chunked_array/strings/mod.rs +++ b/crates/polars-ops/src/chunked_array/strings/mod.rs @@ -10,6 +10,8 @@ mod justify; mod namespace; #[cfg(feature = "strings")] mod replace; +#[cfg(feature = "strings")] +mod substring; #[cfg(feature = "extract_jsonpath")] pub use json_path::*; diff --git a/crates/polars-ops/src/chunked_array/strings/namespace.rs b/crates/polars-ops/src/chunked_array/strings/namespace.rs index c5fddf7583a0..fae3a127143c 100644 --- a/crates/polars-ops/src/chunked_array/strings/namespace.rs +++ b/crates/polars-ops/src/chunked_array/strings/namespace.rs @@ -2,8 +2,6 @@ use base64::engine::general_purpose; #[cfg(feature = "string_encoding")] use base64::Engine as _; -use polars_arrow::export::arrow::compute::substring::substring; -use 
polars_arrow::export::arrow::{self}; use polars_arrow::kernels::string::*; #[cfg(feature = "string_from_radix")] use polars_core::export::num::Num; @@ -502,14 +500,12 @@ pub trait Utf8NameSpaceImpl: AsUtf8 { /// /// Determines a substring starting from `start` and with optional length `length` of each of the elements in `array`. /// `start` can be negative, in which case the start counts from the end of the string. - fn str_slice(&self, start: i64, length: Option) -> PolarsResult { + fn str_slice(&self, start: i64, length: Option) -> Utf8Chunked { let ca = self.as_utf8(); - let chunks = ca + let iter = ca .downcast_iter() - .map(|c| substring(c, start, &length)) - .collect::>()?; - // SAFETY: these are all the same type. - unsafe { Ok(Utf8Chunked::from_chunks(ca.name(), chunks)) } + .map(|c| substring::utf8_substring(c, start, &length)); + Utf8Chunked::from_chunk_iter_like(ca, iter) } } diff --git a/crates/polars-ops/src/chunked_array/strings/substring.rs b/crates/polars-ops/src/chunked_array/strings/substring.rs new file mode 100644 index 000000000000..e485e25dd216 --- /dev/null +++ b/crates/polars-ops/src/chunked_array/strings/substring.rs @@ -0,0 +1,51 @@ +use arrow::array::Utf8Array; + +/// Returns a Utf8Array with a substring starting from `start` and with optional length `length` of each of the elements in `array`. +/// `start` can be negative, in which case the start counts from the end of the string. +pub(super) fn utf8_substring( + array: &Utf8Array, + start: i64, + length: &Option, +) -> Utf8Array { + let length = length.map(|v| v as usize); + + let iter = array.values_iter().map(|str_val| { + // compute where we should start slicing this entry. + let start = if start >= 0 { + start as usize + } else { + let start = (0i64 - start) as usize; + str_val + .char_indices() + .rev() + .nth(start) + .map(|(idx, _)| idx + 1) + .unwrap_or(0) + }; + + let mut iter_chars = str_val.char_indices(); + if let Some((start_idx, _)) = iter_chars.nth(start) { + // length of the str + let len_end = str_val.len() - start_idx; + + // length to slice + let length = length.unwrap_or(len_end); + + if length == 0 { + return ""; + } + // compute + let end_idx = iter_chars + .nth(length.saturating_sub(1)) + .map(|(idx, _)| idx) + .unwrap_or(str_val.len()); + + &str_val[start_idx..end_idx] + } else { + "" + } + }); + + let new = Utf8Array::::from_trusted_len_values_iter(iter); + new.with_validity(array.validity().cloned()) +} diff --git a/crates/polars-plan/src/dsl/function_expr/strings.rs b/crates/polars-plan/src/dsl/function_expr/strings.rs index fb62190e2869..d9f72c0b1ff6 100644 --- a/crates/polars-plan/src/dsl/function_expr/strings.rs +++ b/crates/polars-plan/src/dsl/function_expr/strings.rs @@ -744,7 +744,7 @@ pub(super) fn from_radix(s: &Series, radix: u32, strict: bool) -> PolarsResult) -> PolarsResult { let ca = s.utf8()?; - ca.str_slice(start, length).map(|ca| ca.into_series()) + Ok(ca.str_slice(start, length).into_series()) } pub(super) fn explode(s: &Series) -> PolarsResult { diff --git a/crates/polars-sql/Cargo.toml b/crates/polars-sql/Cargo.toml index 0b72313cae27..30f65a7565d7 100644 --- a/crates/polars-sql/Cargo.toml +++ b/crates/polars-sql/Cargo.toml @@ -9,7 +9,7 @@ repository = { workspace = true } description = "SQL transpiler for Polars. 
Converts SQL to Polars logical plans" [dependencies] -polars-arrow = { workspace = true, features = ["like"] } +polars-arrow = { workspace = true } polars-core = { workspace = true } polars-lazy = { workspace = true, features = ["strings", "cross_join", "trigonometry", "abs", "round_series", "log", "regex", "is_in", "meta", "cum_agg"] } polars-plan = { workspace = true } diff --git a/py-polars/Cargo.lock b/py-polars/Cargo.lock index 80af294ee9f7..0b88f92c9540 100644 --- a/py-polars/Cargo.lock +++ b/py-polars/Cargo.lock @@ -96,42 +96,6 @@ dependencies = [ "serde", ] -[[package]] -name = "arrow2" -version = "0.18.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "963fef509b757bcbbf9e5ffa23bcb345614d99f4f6f531f97417b27b8604d389" -dependencies = [ - "ahash", - "arrow-format", - "avro-schema", - "base64", - "bytemuck", - "chrono", - "chrono-tz", - "dyn-clone", - "either", - "ethnum", - "fallible-streaming-iterator", - "foreign_vec", - "futures", - "getrandom", - "hash_hasher", - "hashbrown 0.14.0", - "lexical-core", - "lz4", - "multiversion", - "num-traits", - "parquet2", - "regex", - "regex-syntax", - "rustc_version", - "simdutf8", - "streaming-iterator", - "strength_reduce", - "zstd", -] - [[package]] name = "async-stream" version = "0.3.5" @@ -315,8 +279,10 @@ checksum = "7f2c685bad3eb3d45a01354cedb7d5faa66194d1d58ba6e267a8de788f79db38" dependencies = [ "android-tzdata", "iana-time-zone", + "js-sys", "num-traits", "serde", + "wasm-bindgen", "windows-targets", ] @@ -718,12 +684,6 @@ dependencies = [ "serde", ] -[[package]] -name = "hash_hasher" -version = "2.0.3" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "74721d007512d0cb3338cd20f0654ac913920061a4c4d0d8708edb3f2a698c0c" - [[package]] name = "hashbrown" version = "0.13.2" @@ -1168,6 +1128,37 @@ dependencies = [ "target-features", ] +[[package]] +name = "nano-arrow" +version = "0.1.0" +dependencies = [ + "ahash", + "arrow-format", + "avro-schema", + "base64", + "bytemuck", + "chrono", + "chrono-tz", + "dyn-clone", + "either", + "ethnum", + "fallible-streaming-iterator", + "foreign_vec", + "futures", + "getrandom", + "hashbrown 0.14.0", + "lexical-core", + "lz4", + "multiversion", + "num-traits", + "parquet2", + "rustc_version", + "simdutf8", + "streaming-iterator", + "strength_reduce", + "zstd", +] + [[package]] name = "ndarray" version = "0.15.6" @@ -1417,13 +1408,13 @@ dependencies = [ name = "polars-arrow" version = "0.33.2" dependencies = [ - "arrow2", "atoi", "chrono", "chrono-tz", "ethnum", "hashbrown 0.14.0", "multiversion", + "nano-arrow", "num-traits", "polars-error", "serde", @@ -1436,7 +1427,6 @@ name = "polars-core" version = "0.33.2" dependencies = [ "ahash", - "arrow2", "bitflags 2.4.0", "chrono", "chrono-tz", @@ -1445,6 +1435,7 @@ dependencies = [ "hashbrown 0.14.0", "indexmap", "itoap", + "nano-arrow", "ndarray", "num-traits", "once_cell", @@ -1468,7 +1459,7 @@ dependencies = [ name = "polars-error" version = "0.33.2" dependencies = [ - "arrow2", + "nano-arrow", "regex", "thiserror", ] @@ -1477,7 +1468,7 @@ dependencies = [ name = "polars-ffi" version = "0.33.2" dependencies = [ - "arrow2", + "nano-arrow", "polars-core", ] @@ -1486,7 +1477,6 @@ name = "polars-io" version = "0.33.2" dependencies = [ "ahash", - "arrow2", "bytes", "chrono", "chrono-tz", @@ -1497,6 +1487,7 @@ dependencies = [ "lexical-core", "memchr", "memmap2", + "nano-arrow", "num-traits", "once_cell", "polars-arrow", @@ -1518,15 +1509,18 @@ name = "polars-json" version = "0.33.2" dependencies = [ 
"ahash", - "arrow2", + "chrono", "fallible-streaming-iterator", "hashbrown 0.14.0", "indexmap", + "lexical-core", + "nano-arrow", "num-traits", "polars-arrow", "polars-error", "polars-utils", "simd-json", + "streaming-iterator", ] [[package]] @@ -1557,7 +1551,6 @@ name = "polars-ops" version = "0.33.2" dependencies = [ "argminmax", - "arrow2", "base64", "chrono", "chrono-tz", @@ -1566,6 +1559,7 @@ dependencies = [ "indexmap", "jsonpath_lib", "memchr", + "nano-arrow", "polars-arrow", "polars-core", "polars-json", @@ -1603,11 +1597,11 @@ name = "polars-plan" version = "0.33.2" dependencies = [ "ahash", - "arrow2", "chrono", "chrono-tz", "ciborium", "libloading", + "nano-arrow", "once_cell", "polars-arrow", "polars-core", @@ -1629,7 +1623,7 @@ dependencies = [ name = "polars-row" version = "0.33.2" dependencies = [ - "arrow2", + "nano-arrow", "polars-error", "polars-utils", ] @@ -1651,10 +1645,10 @@ dependencies = [ name = "polars-time" version = "0.33.2" dependencies = [ - "arrow2", "atoi", "chrono", "chrono-tz", + "nano-arrow", "now", "once_cell", "polars-arrow",