diff --git a/arrow-row/src/lib.rs b/arrow-row/src/lib.rs
index 078c4574775d..e6c2293f7ce4 100644
--- a/arrow-row/src/lib.rs
+++ b/arrow-row/src/lib.rs
@@ -180,6 +180,7 @@ use arrow_array::types::{Int16Type, Int32Type, Int64Type};
 
 mod fixed;
 mod list;
+pub mod radix;
 mod run;
 mod variable;
 
@@ -1451,6 +1452,31 @@ impl<'a> Row<'a> {
     pub fn data(&self) -> &'a [u8] {
         self.data
     }
+
+    /// The byte at `offset`, or 0 if `offset` is past the end of the row.
+    #[inline]
+    pub fn byte_from(&self, offset: usize) -> u8 {
+        if offset < self.data.len() {
+            // SAFETY: bounds checked above
+            unsafe { *self.data.get_unchecked(offset) }
+        } else {
+            0
+        }
+    }
+
+    /// The row's bytes starting at `offset`, or an empty slice if
+    /// `offset` exceeds the row length.
+    ///
+    /// Useful for comparing rows that share a known prefix (e.g.,
+    /// after radix sort has already discriminated on earlier bytes).
+    pub fn data_from(&self, offset: usize) -> &'a [u8] {
+        if offset <= self.data.len() {
+            // SAFETY: bounds checked above
+            unsafe { self.data.get_unchecked(offset..) }
+        } else {
+            &[]
+        }
+    }
 }
 
 // Manually derive these as don't wish to include `fields`
diff --git a/arrow-row/src/radix.rs b/arrow-row/src/radix.rs
new file mode 100644
index 000000000000..7262ea814169
--- /dev/null
+++ b/arrow-row/src/radix.rs
@@ -0,0 +1,759 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! MSD radix sort on row-encoded keys.
+//!
+//! The Arrow row format produces big-endian, memcmp-comparable byte sequences,
+//! making it ideal for MSD (Most Significant Digit) radix sort without any
+//! additional encoding. This gives O(n × key_width) performance instead of
+//! O(n log n × comparison_cost).
+//!
+//! # When to use this
+//!
+//! Radix sort is the fastest strategy when sorting by **two or more columns**,
+//! especially as N grows. It benefits from:
+//! - **Multi-column schemas** where comparison sort must traverse columns
+//!   per comparison, while radix sort pays a fixed cost per byte position
+//! - **String columns**, where the row encoding produces compact,
+//!   high-entropy byte sequences that radix passes discriminate quickly
+//! - **Mixed column types** (primitives, strings, dicts, lists)
+//!
+//! # When NOT to use this
+//!
+//! Prefer [`lexsort_to_indices`] when:
+//! - **Sorting by a single column.** The row encoding overhead (allocation,
+//!   encoding, indirection through `Rows`) outweighs the radix advantage.
+//!   Single-column sorts are faster with direct comparison sort on the
+//!   columnar array, which avoids encoding entirely.
+//! - **All sort columns are low-cardinality dictionaries** with no
+//!   high-cardinality column to break ties. The row encoding for
+//!   dictionary values produces long shared prefixes, and radix sort
+//!   gains little from its first few byte passes before falling back
+//!   to comparison sort.
+//! - **Columns with low-entropy leading bytes**, such as `Decimal128` or
+//!   `Decimal256`. These types are encoded as 16- or 32-byte big-endian
+//!   integers, but real-world values occupy a tiny fraction of the range.
+//!   The leading bytes are nearly identical across rows (e.g., `0x80` for
+//!   small positive values), so radix passes burn through the max depth
+//!   without discriminating rows, then fall back to comparison sort.
+//! - **A leading primitive column discriminates most rows and a trailing
+//!   column is expensive to encode** (e.g., lists). [`lexsort_to_indices`]
+//!   avoids encoding the trailing column for rows already resolved by
+//!   the leading column.
+//!
+//! [`lexsort_to_indices`]: https://docs.rs/arrow-ord/latest/arrow_ord/sort/fn.lexsort_to_indices.html
+
+use crate::Rows;
+
+/// Buckets smaller than this fall back to comparison sort. A lower
+/// threshold favors the comparison path, which avoids the ping-pong
+/// buffer overhead and per-level indirection cost of radix passes on
+/// small buckets where O(n log n) comparison sort is already cheap.
+const FALLBACK_THRESHOLD: usize = 32;
+
+/// Maximum number of radix passes before falling back to comparison
+/// sort. Each pass chases pointers through the Rows offset/buffer
+/// indirection, so deeper passes hit diminishing returns as buckets
+/// shrink and the per-level overhead dominates. 8 bytes covers the
+/// discriminating prefix of most key layouts including skewed or
+/// narrow-range distributions; remaining ties are resolved by
+/// comparison sort on the suffix.
+const MAX_DEPTH: usize = 8;
+
+/// Sort row indices using MSD radix sort on row-encoded keys.
+///
+/// Takes [`Rows`] produced by [`RowConverter::convert_columns`] and returns
+/// a `Vec<u32>` of row indices in sorted order. The caller is responsible for
+/// encoding columns into row format and for using the returned indices to
+/// reorder the original arrays (e.g., via [`take`]).
+///
+/// See the [module-level documentation](self) for guidance on when radix sort
+/// is faster than [`lexsort_to_indices`].
+///
+/// # Example
+///
+/// ```
+/// # use std::sync::Arc;
+/// # use arrow_row::{RowConverter, SortField};
+/// # use arrow_row::radix::radix_sort_to_indices;
+/// # use arrow_array::{Int32Array, ArrayRef};
+/// # use arrow_schema::DataType;
+/// let array: ArrayRef = Arc::new(Int32Array::from(vec![5, 3, 1, 4, 2]));
+/// let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+/// let rows = converter.convert_columns(&[array]).unwrap();
+/// let indices = radix_sort_to_indices(&rows);
+/// assert_eq!(indices, vec![2, 4, 1, 3, 0]); // points to [1, 2, 3, 4, 5]
+/// ```
+///
+/// [`RowConverter::convert_columns`]: crate::RowConverter::convert_columns
+/// [`take`]: https://docs.rs/arrow/latest/arrow/compute/fn.take.html
+/// [`lexsort_to_indices`]: https://docs.rs/arrow-ord/latest/arrow_ord/sort/fn.lexsort_to_indices.html
+pub fn radix_sort_to_indices(rows: &Rows) -> Vec<u32> {
+    radix_sort_to_indices_with(rows, MAX_DEPTH, FALLBACK_THRESHOLD)
+}
+
+/// Like [`radix_sort_to_indices`] but with tunable parameters for
+/// benchmarking. `max_depth` controls how many radix passes to run
+/// before falling back to comparison sort. `fallback_threshold` is
+/// the bucket size below which we switch to comparison sort.
+pub fn radix_sort_to_indices_with(
+    rows: &Rows,
+    max_depth: usize,
+    fallback_threshold: usize,
+) -> Vec<u32> {
+    let n = rows.num_rows();
+    let mut indices: Vec<u32> = (0..n as u32).collect();
+    let mut temp = vec![0u32; n];
+    let mut bytes = vec![0u8; n];
+    let config = RadixSortConfig {
+        max_depth,
+        fallback_threshold,
+    };
+    msd_radix_sort(&mut indices, &mut temp, &mut bytes, rows, 0, true, &config);
+    indices
+}
+
+/// Tunable parameters for MSD radix sort.
+struct RadixSortConfig {
+    /// Maximum number of radix passes before falling back to comparison sort.
+    max_depth: usize,
+    /// Buckets smaller than this fall back to comparison sort.
+    fallback_threshold: usize,
+}
+
+impl Default for RadixSortConfig {
+    fn default() -> Self {
+        Self {
+            max_depth: MAX_DEPTH,
+            fallback_threshold: FALLBACK_THRESHOLD,
+        }
+    }
+}
+///
+/// # Safety
+/// `idx` must be a valid row index in `rows`.
+#[inline(always)]
+unsafe fn row_byte(rows: &Rows, idx: u32, byte_pos: usize) -> u8 {
+    // SAFETY: caller guarantees idx is a valid row index
+    unsafe { rows.row_unchecked(idx as usize) }.byte_from(byte_pos)
+}
+
+/// MSD radix sort using ping-pong buffers.
+///
+/// Each level scatters from `src` into `dst`, then recurses with the
+/// roles swapped (dst becomes the next level's src). This avoids an
+/// O(n) `copy_from_slice` at every recursion level.
+///
+/// `result_in_src` tracks where the caller expects the sorted output:
+/// true means `src`, false means `dst`. It flips at each scatter so
+/// the final result lands in the right buffer. The top-level call
+/// passes `true` so the answer ends up in `indices`.
+fn msd_radix_sort(
+    src: &mut [u32],
+    dst: &mut [u32],
+    bytes: &mut [u8],
+    rows: &Rows,
+    byte_pos: usize,
+    result_in_src: bool,
+    config: &RadixSortConfig,
+) {
+    let n = src.len();
+
+    if n <= config.fallback_threshold || byte_pos >= config.max_depth {
+        // Compare only from byte_pos onward — earlier bytes are identical
+        // within this bucket, having already been discriminated by radix
+        // passes above us. Safe slice via get() is needed because rows of
+        // different lengths can share a bucket when a shorter row's
+        // past-end default (0) matches a longer row's real byte value.
+        //
+        // When !result_in_src the caller expects the output in dst, so
+        // we copy first and sort in place there.
+        if result_in_src {
+            src.sort_unstable_by(|&a, &b| {
+                // SAFETY: indices contains a permutation of 0..rows.num_rows()
+                let ra = unsafe { rows.row_unchecked(a as usize) };
+                let rb = unsafe { rows.row_unchecked(b as usize) };
+                ra.data_from(byte_pos).cmp(rb.data_from(byte_pos))
+            });
+        } else {
+            dst.copy_from_slice(src);
+            dst.sort_unstable_by(|&a, &b| {
+                // SAFETY: indices contains a permutation of 0..rows.num_rows()
+                let ra = unsafe { rows.row_unchecked(a as usize) };
+                let rb = unsafe { rows.row_unchecked(b as usize) };
+                ra.data_from(byte_pos).cmp(rb.data_from(byte_pos))
+            });
+        }
+        return;
+    }
+
+    // Extract bytes and build histogram in one pass. The bytes buffer
+    // is reused across levels so the scatter loop can read from a flat
+    // array instead of chasing pointers through Rows a second time.
+    let bytes = &mut bytes[..n];
+    let mut counts = [0u32; 256];
+    for (i, &idx) in src.iter().enumerate() {
+        // SAFETY: src contains valid row indices
+        let b = unsafe { row_byte(rows, idx, byte_pos) };
+        bytes[i] = b;
+        counts[b as usize] += 1;
+    }
+
+    let mut offsets = [0u32; 257];
+    let mut num_buckets = 0u32;
+    for i in 0..256 {
+        num_buckets += (counts[i] > 0) as u32;
+        offsets[i + 1] = offsets[i] + counts[i];
+    }
+
+    // No scatter happened — data is still in src, roles unchanged.
+    if num_buckets == 1 {
+        msd_radix_sort(src, dst, bytes, rows, byte_pos + 1, result_in_src, config);
+        return;
+    }
+
+    // Scatter src → dst using the pre-extracted bytes
+    let mut write_pos = offsets;
+    for (i, &idx) in src.iter().enumerate() {
+        let b = bytes[i] as usize;
+        dst[write_pos[b] as usize] = idx;
+        write_pos[b] += 1;
+    }
+
+    // Recurse with roles swapped: after scatter the data lives in dst,
+    // so dst becomes the next level's src. Flipping result_in_src
+    // ensures each level's output lands where the caller above expects.
+    for bucket in 0..256 {
+        let start = offsets[bucket] as usize;
+        let end = offsets[bucket + 1] as usize;
+        let len = end - start;
+        if len > 1 {
+            msd_radix_sort(
+                &mut dst[start..end],
+                &mut src[start..end],
+                &mut bytes[start..end],
+                rows,
+                byte_pos + 1,
+                !result_in_src,
+                config,
+            );
+        } else if len == 1 && result_in_src {
+            // Single-element bucket doesn't recurse. After scatter
+            // the element is in dst; copy it back if the caller
+            // expects the result in src.
+            src[start] = dst[start];
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::{RowConverter, SortField};
+    use arrow_array::{ArrayRef, BooleanArray, Float64Array, Int32Array, StringArray};
+    use arrow_schema::{DataType, SortOptions};
+    use rand::rngs::StdRng;
+    use rand::{Rng, SeedableRng};
+    use std::sync::Arc;
+
+    fn assert_sorted(rows: &Rows, indices: &[u32]) {
+        for i in 1..indices.len() {
+            let a = rows.row(indices[i - 1] as usize);
+            let b = rows.row(indices[i] as usize);
+            assert!(
+                a <= b,
+                "row {} should be <= row {}",
+                indices[i - 1],
+                indices[i]
+            );
+        }
+    }
+
+    #[test]
+    fn test_radix_sort_integers() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![5, 3, 1, 4, 2]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+        assert_eq!(indices, vec![2, 4, 1, 3, 0]);
+    }
+
+    #[test]
+    fn test_radix_sort_strings() {
+        let array: ArrayRef =
+            Arc::new(StringArray::from(vec!["banana", "apple", "cherry", "date"]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Utf8)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+        assert_eq!(indices, vec![1, 0, 2, 3]);
+    }
+
+    #[test]
+    fn test_radix_sort_with_nulls() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![
+            Some(3),
+            None,
+            Some(1),
+            None,
+            Some(2),
+        ]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_multi_column() {
+        let a1: ArrayRef = Arc::new(Int32Array::from(vec![1, 1, 2, 2]));
+        let a2: ArrayRef = Arc::new(StringArray::from(vec!["b", "a", "d", "c"]));
+        let converter = RowConverter::new(vec![
+            SortField::new(DataType::Int32),
+            SortField::new(DataType::Utf8),
+        ])
+        .unwrap();
+        let rows = converter.convert_columns(&[a1, a2]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+        assert_eq!(indices, vec![1, 0, 3, 2]);
+    }
+
+    #[test]
+    fn test_radix_sort_empty() {
+        let array: ArrayRef = Arc::new(Int32Array::from(Vec::<i32>::new()));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert!(indices.is_empty());
+    }
+
+    #[test]
+    fn test_radix_sort_single_element() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![42]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_eq!(indices, vec![0]);
+    }
+
+    #[test]
+    fn test_radix_sort_all_equal() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![7, 7, 7, 7, 7]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_descending() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![1, 3, 2, 5, 4]));
+        let options = SortOptions::default().desc();
+        let converter =
+            RowConverter::new(vec![SortField::new_with_options(DataType::Int32, options)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_nulls_first() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![
+            Some(3),
+            None,
+            Some(1),
+            None,
+            Some(2),
+        ]));
+        let options = SortOptions::default().with_nulls_first(true);
+        let converter =
+            RowConverter::new(vec![SortField::new_with_options(DataType::Int32, options)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_descending_nulls_first() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![
+            Some(3),
+            None,
+            Some(1),
+            None,
+            Some(2),
+        ]));
+        let options = SortOptions::default().desc().with_nulls_first(true);
+        let converter =
+            RowConverter::new(vec![SortField::new_with_options(DataType::Int32, options)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_all_sort_option_combos() {
+        let array: ArrayRef = Arc::new(Int32Array::from(vec![
+            Some(5),
+            None,
+            Some(3),
+            None,
+            Some(1),
+            Some(4),
+            Some(2),
+        ]));
+
+        for descending in [false, true] {
+            for nulls_first in [false, true] {
+                let options = SortOptions {
+                    descending,
+                    nulls_first,
+                };
+                let converter =
+                    RowConverter::new(vec![SortField::new_with_options(DataType::Int32, options)])
+                        .unwrap();
+                let rows = converter
+                    .convert_columns(std::slice::from_ref(&array))
+                    .unwrap();
+
+                let indices = radix_sort_to_indices(&rows);
+                assert_sorted(&rows, &indices);
+            }
+        }
+    }
+
+    #[test]
+    fn test_radix_sort_floats_with_nan() {
+        let array: ArrayRef = Arc::new(Float64Array::from(vec![
+            Some(1.0),
+            Some(f64::NAN),
+            None,
+            Some(-1.0),
+            Some(f64::INFINITY),
+            Some(f64::NEG_INFINITY),
+            Some(0.0),
+        ]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Float64)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    #[test]
+    fn test_radix_sort_booleans() {
+        let array: ArrayRef = Arc::new(BooleanArray::from(vec![
+            Some(true),
+            None,
+            Some(false),
+            Some(true),
+            None,
+            Some(false),
+        ]));
+        let converter = RowConverter::new(vec![SortField::new(DataType::Boolean)]).unwrap();
+        let rows = converter.convert_columns(&[array]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+
+    // Tests sizes around the FALLBACK_THRESHOLD (64) to exercise both paths
+    #[test]
+    fn test_radix_sort_threshold_boundary() {
+        let mut rng = StdRng::seed_from_u64(0xCAFE);
+        for n in [1, 2, 32, 63, 64, 65, 100, 128, 256, 500, 1000] {
+            let values: Vec<Option<i32>> = (0..n)
+                .map(|_| {
+                    if rng.random_bool(0.1) {
+                        None
+                    } else {
+                        Some(rng.random_range(-1000..1000))
+                    }
+                })
+                .collect();
+            let array: ArrayRef = Arc::new(Int32Array::from(values));
+            let converter = RowConverter::new(vec![SortField::new(DataType::Int32)]).unwrap();
+            let rows = converter.convert_columns(&[array]).unwrap();
+
+            let indices = radix_sort_to_indices(&rows);
+            assert_sorted(&rows, &indices);
+            assert_eq!(indices.len(), n, "wrong number of indices for n={n}");
+        }
+    }
+
+    /// Generate random arrays and verify radix sort produces correctly sorted output
+    /// across random column types, sort options, and sizes.
+    #[test]
+    fn test_radix_sort_fuzz() {
+        let mut rng = StdRng::seed_from_u64(0xF00D);
+
+        for iteration in 0..100 {
+            let num_columns = rng.random_range(1..=4);
+            let len = rng.random_range(5..500);
+
+            let mut arrays: Vec<ArrayRef> = Vec::new();
+            let mut fields: Vec<SortField> = Vec::new();
+
+            for _ in 0..num_columns {
+                let options = SortOptions {
+                    descending: rng.random_bool(0.5),
+                    nulls_first: rng.random_bool(0.5),
+                };
+                let null_rate = if rng.random_bool(0.3) { 0.0 } else { 0.2 };
+
+                // Pick a random column type
+                let (array, dt) = match rng.random_range(0..7) {
+                    0 => {
+                        let vals: Vec<Option<i32>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    Some(rng.random_range(-10000..10000))
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(Int32Array::from(vals)) as ArrayRef,
+                            DataType::Int32,
+                        )
+                    }
+                    1 => {
+                        let vals: Vec<Option<i64>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    Some(rng.random())
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(arrow_array::Int64Array::from(vals)) as ArrayRef,
+                            DataType::Int64,
+                        )
+                    }
+                    2 => {
+                        let vals: Vec<Option<f64>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    Some(rng.random::<f64>() * 1000.0 - 500.0)
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(Float64Array::from(vals)) as ArrayRef,
+                            DataType::Float64,
+                        )
+                    }
+                    3 => {
+                        let vals: Vec<Option<&str>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    // Fixed set of strings to get some collisions
+                                    Some(
+                                        [
+                                            "alpha",
+                                            "beta",
+                                            "gamma",
+                                            "delta",
+                                            "epsilon",
+                                            "zeta",
+                                            "eta",
+                                            "theta",
+                                            "iota",
+                                            "kappa",
+                                            "a longer string for testing",
+                                            "",
+                                        ][rng.random_range(0..12)],
+                                    )
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(StringArray::from(vals)) as ArrayRef,
+                            DataType::Utf8,
+                        )
+                    }
+                    4 => {
+                        let vals: Vec<Option<bool>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    Some(rng.random_bool(0.5))
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(BooleanArray::from(vals)) as ArrayRef,
+                            DataType::Boolean,
+                        )
+                    }
+                    5 => {
+                        // Low-cardinality i32 to create many ties
+                        let vals: Vec<Option<i32>> = (0..len)
+                            .map(|_| {
+                                if rng.random_bool(null_rate) {
+                                    None
+                                } else {
+                                    Some(rng.random_range(0..5))
+                                }
+                            })
+                            .collect();
+                        (
+                            Arc::new(Int32Array::from(vals)) as ArrayRef,
+                            DataType::Int32,
+                        )
+                    }
+                    _ => {
+                        // All-null column
+                        let vals: Vec<Option<i32>> = vec![None; len];
+                        (
+                            Arc::new(Int32Array::from(vals)) as ArrayRef,
+                            DataType::Int32,
+                        )
+                    }
+                };
+
+                arrays.push(array);
+                fields.push(SortField::new_with_options(dt, options));
+            }
+
+            let converter = RowConverter::new(fields).unwrap();
+            let rows = converter.convert_columns(&arrays).unwrap();
+
+            let indices = radix_sort_to_indices(&rows);
+            assert_sorted(&rows, &indices);
+            assert_eq!(
+                indices.len(),
+                len,
+                "iteration {iteration}: wrong index count"
+            );
+
+            // Verify every original index appears exactly once
+            let mut seen = vec![false; len];
+            for &idx in &indices {
+                assert!(
+                    !seen[idx as usize],
+                    "iteration {iteration}: duplicate index {idx}"
+                );
+                seen[idx as usize] = true;
+            }
+        }
+    }
+
+    /// Verify radix sort matches comparison sort on row-encoded keys.
+    /// Uses the same Rows, so any difference is a bug in the radix sort itself.
+    #[test]
+    fn test_radix_matches_comparison_sort() {
+        let mut rng = StdRng::seed_from_u64(0xBEEF);
+
+        for _ in 0..50 {
+            let len = rng.random_range(100..1000);
+            let vals: Vec<Option<i32>> = (0..len)
+                .map(|_| {
+                    if rng.random_bool(0.15) {
+                        None
+                    } else {
+                        Some(rng.random_range(-500..500))
+                    }
+                })
+                .collect();
+
+            let options = SortOptions {
+                descending: rng.random_bool(0.5),
+                nulls_first: rng.random_bool(0.5),
+            };
+
+            let array: ArrayRef = Arc::new(Int32Array::from(vals));
+            let converter =
+                RowConverter::new(vec![SortField::new_with_options(DataType::Int32, options)])
+                    .unwrap();
+            let rows = converter.convert_columns(&[array]).unwrap();
+
+            let radix = radix_sort_to_indices(&rows);
+
+            let mut comparison: Vec<u32> = (0..len as u32).collect();
+            comparison.sort_unstable_by(|&a, &b| rows.row(a as usize).cmp(&rows.row(b as usize)));
+
+            // Both sorts operate on the same rows, so equal-keyed elements
+            // should appear in the same relative order only if both are stable
+            // (they aren't), but the *row values* at each position must match.
+            for i in 0..len {
+                let radix_row = rows.row(radix[i] as usize);
+                let cmp_row = rows.row(comparison[i] as usize);
+                assert_eq!(
+                    radix_row, cmp_row,
+                    "mismatch at position {i}: radix idx={} vs comparison idx={}",
+                    radix[i], comparison[i]
+                );
+            }
+        }
+    }
+
+    /// Test with a multi-column schema that has mixed sort options per column.
+    #[test]
+    fn test_radix_sort_multi_column_mixed_options() {
+        let a1: ArrayRef = Arc::new(Int32Array::from(vec![
+            Some(1),
+            None,
+            Some(1),
+            Some(2),
+            None,
+        ]));
+        let a2: ArrayRef = Arc::new(StringArray::from(vec![
+            Some("z"),
+            Some("a"),
+            Some("a"),
+            None,
+            Some("m"),
+        ]));
+
+        // Col 1: ascending nulls_last, Col 2: descending nulls_first
+        let converter = RowConverter::new(vec![
+            SortField::new_with_options(
+                DataType::Int32,
+                SortOptions::default().asc().with_nulls_first(false),
+            ),
+            SortField::new_with_options(
+                DataType::Utf8,
+                SortOptions::default().desc().with_nulls_first(true),
+            ),
+        ])
+        .unwrap();
+        let rows = converter.convert_columns(&[a1, a2]).unwrap();
+
+        let indices = radix_sort_to_indices(&rows);
+        assert_sorted(&rows, &indices);
+    }
+}
diff --git a/arrow/benches/lexsort.rs b/arrow/benches/lexsort.rs
index 16a2606b919a..50c00684f9de 100644
--- a/arrow/benches/lexsort.rs
+++ b/arrow/benches/lexsort.rs
@@ -16,12 +16,13 @@
 // under the License.
 
 use arrow::compute::{SortColumn, lexsort_to_indices};
+use arrow::row::radix::radix_sort_to_indices;
 use arrow::row::{RowConverter, SortField};
 use arrow::util::bench_util::{
     create_dict_from_values, create_primitive_array, create_string_array_with_len,
 };
 use arrow::util::data_gen::create_random_array;
-use arrow_array::types::Int32Type;
+use arrow_array::types::{Float64Type, Int32Type, Int64Type};
 use arrow_array::{Array, ArrayRef, UInt32Array};
 use arrow_schema::{DataType, Field};
 use criterion::{Criterion, criterion_group, criterion_main};
@@ -31,6 +32,10 @@ use std::{hint, sync::Arc};
 enum Column {
     RequiredI32,
     OptionalI32,
+    RequiredI64,
+    OptionalI64,
+    RequiredF64,
+    OptionalF64,
     Required16CharString,
     Optional16CharString,
     Optional50CharString,
@@ -46,6 +51,10 @@ impl std::fmt::Debug for Column {
         let s = match self {
             Column::RequiredI32 => "i32",
             Column::OptionalI32 => "i32_opt",
+            Column::RequiredI64 => "i64",
+            Column::OptionalI64 => "i64_opt",
+            Column::RequiredF64 => "f64",
+            Column::OptionalF64 => "f64_opt",
             Column::Required16CharString => "str(16)",
             Column::Optional16CharString => "str_opt(16)",
             Column::Optional50CharString => "str_opt(50)",
@@ -64,6 +73,10 @@ impl Column {
         match self {
             Column::RequiredI32 => Arc::new(create_primitive_array::<Int32Type>(size, 0.)),
             Column::OptionalI32 => Arc::new(create_primitive_array::<Int32Type>(size, 0.2)),
+            Column::RequiredI64 => Arc::new(create_primitive_array::<Int64Type>(size, 0.)),
+            Column::OptionalI64 => Arc::new(create_primitive_array::<Int64Type>(size, 0.2)),
+            Column::RequiredF64 => Arc::new(create_primitive_array::<Float64Type>(size, 0.)),
+            Column::OptionalF64 => Arc::new(create_primitive_array::<Float64Type>(size, 0.2)),
             Column::Required16CharString => {
                 Arc::new(create_string_array_with_len::<i32>(size, 0., 16))
             }
@@ -146,10 +159,36 @@ fn do_bench(c: &mut Criterion, columns: &[Column], len: usize) {
             })
         })
     });
+
+    c.bench_function(&format!("lexsort_radix({columns:?}): {len}"), |b| {
+        b.iter(|| {
+            hint::black_box({
+                let fields = arrays
+                    .iter()
+                    .map(|a| SortField::new(a.data_type().clone()))
+                    .collect();
+                let converter = RowConverter::new(fields).unwrap();
+                let rows = converter.convert_columns(&arrays).unwrap();
+                let indices = radix_sort_to_indices(&rows);
+                UInt32Array::from_iter_values(indices)
+            })
+        })
+    });
 }
 
 fn add_benchmark(c: &mut Criterion) {
     let cases: &[&[Column]] = &[
+        // Single-column primitives
+        &[Column::RequiredI32],
+        &[Column::OptionalI32],
+        &[Column::RequiredI64],
+        &[Column::OptionalI64],
+        &[Column::RequiredF64],
+        &[Column::OptionalF64],
+        // Single-column strings
+        &[Column::Required16CharString],
+        &[Column::Optional16CharString],
+        // Multi-column
         &[Column::RequiredI32, Column::OptionalI32],
         &[Column::RequiredI32, Column::Optional16CharString],
         &[Column::RequiredI32, Column::Required16CharString],
@@ -186,12 +225,6 @@ fn add_benchmark(c: &mut Criterion) {
             Column::Optional100Value50CharStringDict,
             Column::Optional50CharString,
         ],
-        &[
-            Column::Optional100Value50CharStringDict,
-            Column::Optional100Value50CharStringDict,
-            Column::Optional100Value50CharStringDict,
-            Column::Optional50CharString,
-        ],
         &[Column::OptionalI32, Column::RequiredI32List],
         &[Column::OptionalI32, Column::OptionalI32List],
         &[Column::OptionalI32List, Column::OptionalI32],