diff --git a/crates/polars-core/Cargo.toml b/crates/polars-core/Cargo.toml
index c9d68f0ee173..13047c5f600b 100644
--- a/crates/polars-core/Cargo.toml
+++ b/crates/polars-core/Cargo.toml
@@ -101,6 +101,7 @@ describe = []
 timezones = ["temporal", "chrono", "chrono-tz", "arrow/chrono-tz", "arrow/timezones"]
 dynamic_group_by = ["dtype-datetime", "dtype-date"]
 arrow_rs = ["arrow-array", "arrow/arrow_rs"]
+list_arithmetic = []
 
 # opt-in datatypes for Series
 dtype-date = ["temporal"]
@@ -148,6 +149,7 @@ docs-selection = [
   "describe",
   "partition_by",
   "algorithm_group_by",
+  "list_arithmetic",
 ]
 
 [package.metadata.docs.rs]
diff --git a/crates/polars-core/src/series/arithmetic/list_borrowed.rs b/crates/polars-core/src/series/arithmetic/list_borrowed.rs
index f59492f71cb9..d1558e7f86fc 100644
--- a/crates/polars-core/src/series/arithmetic/list_borrowed.rs
+++ b/crates/polars-core/src/series/arithmetic/list_borrowed.rs
@@ -1,16 +1,9 @@
 //! Allow arithmetic operations for ListChunked.
+//! use polars_error::{feature_gated, PolarsResult};
 
-use arrow::bitmap::Bitmap;
-use arrow::compute::utils::combine_validities_and;
-use arrow::offset::OffsetsBuffer;
-use either::Either;
-use num_traits::Zero;
-use polars_compute::arithmetic::pl_num::PlNumArithmetic;
-use polars_compute::arithmetic::ArithmeticKernel;
-use polars_compute::comparisons::TotalEqKernel;
-use polars_utils::float::IsFloat;
+use polars_error::{feature_gated, PolarsResult};
 
-use super::*;
+use super::{IntoSeries, ListChunked, ListType, NumOpsDispatchInner, Series};
 
 impl NumOpsDispatchInner for ListType {
     fn add_to(lhs: &ListChunked, rhs: &Series) -> PolarsResult<Series> {
@@ -45,136 +38,161 @@ pub enum NumericListOp {
 }
 
 impl NumericListOp {
-    fn name(&self) -> &'static str {
-        match self {
-            Self::Add => "add",
-            Self::Sub => "sub",
-            Self::Mul => "mul",
-            Self::Div => "div",
-            Self::Rem => "rem",
-            Self::FloorDiv => "floor_div",
-        }
-    }
-
-    pub fn try_get_leaf_supertype(
-        &self,
-        prim_dtype_lhs: &DataType,
-        prim_dtype_rhs: &DataType,
-    ) -> PolarsResult<DataType> {
-        let dtype = try_get_supertype(prim_dtype_lhs, prim_dtype_rhs)?;
-
-        Ok(if matches!(self, Self::Div) {
-            if dtype.is_float() {
-                dtype
-            } else {
-                DataType::Float64
-            }
-        } else {
-            dtype
-        })
-    }
-
+    #[cfg_attr(not(feature = "list_arithmetic"), allow(unused))]
     pub fn execute(&self, lhs: &Series, rhs: &Series) -> PolarsResult<Series> {
-        // Ideally we only need to rechunk the leaf array, but getting the
-        // list offsets of a ListChunked triggers a rechunk anyway, so we just
-        // do it here.
-        let lhs = lhs.rechunk();
-        let rhs = rhs.rechunk();
-
-        let binary_op_exec = match BinaryListNumericOpHelper::try_new(
-            self.clone(),
-            lhs.name().clone(),
-            lhs.dtype(),
-            rhs.dtype(),
-            lhs.len(),
-            rhs.len(),
-            {
-                let (a, b) = lhs.list_offsets_and_validities_recursive();
-                (a, b, lhs.clone())
-            },
-            {
-                let (a, b) = rhs.list_offsets_and_validities_recursive();
-                (a, b, rhs.clone())
-            },
-            lhs.rechunk_validity(),
-            rhs.rechunk_validity(),
-        )? {
-            Either::Left(v) => v,
-            Either::Right(ca) => return Ok(ca.into_series()),
-        };
-
-        Ok(binary_op_exec.finish()?.into_series())
+        feature_gated!("list_arithmetic", {
+            use either::Either;
+
+            // Ideally we only need to rechunk the leaf array, but getting the
+            // list offsets of a ListChunked triggers a rechunk anyway, so we just
+            // do it here.
+            let lhs = lhs.rechunk();
+            let rhs = rhs.rechunk();
+
+            let binary_op_exec = match BinaryListNumericOpHelper::try_new(
+                self.clone(),
+                lhs.name().clone(),
+                lhs.dtype(),
+                rhs.dtype(),
+                lhs.len(),
+                rhs.len(),
+                {
+                    let (a, b) = lhs.list_offsets_and_validities_recursive();
+                    (a, b, lhs.clone())
+                },
+                {
+                    let (a, b) = rhs.list_offsets_and_validities_recursive();
+                    (a, b, rhs.clone())
+                },
+                lhs.rechunk_validity(),
+                rhs.rechunk_validity(),
+            )? {
+                Either::Left(v) => v,
+                Either::Right(ca) => return Ok(ca.into_series()),
+            };
+
+            Ok(binary_op_exec.finish()?.into_series())
+        })
     }
+}
 
-    /// For operations that perform divisions on integers, sets the validity to NULL on rows where
-    /// the denominator is 0.
-    fn prepare_numeric_op_side_validities<T: PolarsNumericType>(
-        &self,
-        lhs: &mut PrimitiveArray<T::Native>,
-        rhs: &mut PrimitiveArray<T::Native>,
-        swapped: bool,
-    ) where
-        PrimitiveArray<T::Native>: polars_compute::comparisons::TotalEqKernel<Scalar = T::Native>,
-        T::Native: Zero + IsFloat,
-    {
-        if !T::Native::is_float() {
+#[cfg(feature = "list_arithmetic")]
+use inner::BinaryListNumericOpHelper;
+
+#[cfg(feature = "list_arithmetic")]
+mod inner {
+    use arrow::bitmap::Bitmap;
+    use arrow::compute::utils::combine_validities_and;
+    use arrow::offset::OffsetsBuffer;
+    use either::Either;
+    use num_traits::Zero;
+    use polars_compute::arithmetic::pl_num::PlNumArithmetic;
+    use polars_compute::arithmetic::ArithmeticKernel;
+    use polars_compute::comparisons::TotalEqKernel;
+    use polars_utils::float::IsFloat;
+
+    use super::super::*;
+
+    impl NumericListOp {
+        fn name(&self) -> &'static str {
             match self {
-                Self::Div | Self::Rem | Self::FloorDiv => {
-                    let target = if swapped { lhs } else { rhs };
-                    let ne_0 = target.tot_ne_kernel_broadcast(&T::Native::zero());
-                    let validity = combine_validities_and(target.validity(), Some(&ne_0));
-                    target.set_validity(validity);
-                },
-                _ => {},
+                Self::Add => "add",
+                Self::Sub => "sub",
+                Self::Mul => "mul",
+                Self::Div => "div",
+                Self::Rem => "rem",
+                Self::FloorDiv => "floor_div",
             }
         }
-    }
 
-    /// For list<->primitive where the primitive is broadcasted, we can dispatch to
-    /// `ArithmeticKernel`, which can have optimized codepaths for when one side is
-    /// a scalar.
-    fn apply_array_to_scalar<T: PolarsNumericType>(
-        &self,
-        arr_lhs: PrimitiveArray<T::Native>,
-        r: T::Native,
-        swapped: bool,
-    ) -> PrimitiveArray<T::Native> {
-        match self {
-            Self::Add => ArithmeticKernel::wrapping_add_scalar(arr_lhs, r),
-            Self::Sub => {
-                if swapped {
-                    ArithmeticKernel::wrapping_sub_scalar_lhs(r, arr_lhs)
-                } else {
-                    ArithmeticKernel::wrapping_sub_scalar(arr_lhs, r)
-                }
-            },
-            Self::Mul => ArithmeticKernel::wrapping_mul_scalar(arr_lhs, r),
-            Self::Div => {
-                if swapped {
-                    ArithmeticKernel::legacy_div_scalar_lhs(r, arr_lhs)
-                } else {
-                    ArithmeticKernel::legacy_div_scalar(arr_lhs, r)
-                }
-            },
-            Self::Rem => {
-                if swapped {
-                    ArithmeticKernel::wrapping_mod_scalar_lhs(r, arr_lhs)
+        fn try_get_leaf_supertype(
+            &self,
+            prim_dtype_lhs: &DataType,
+            prim_dtype_rhs: &DataType,
+        ) -> PolarsResult<DataType> {
+            let dtype = try_get_supertype(prim_dtype_lhs, prim_dtype_rhs)?;
+
+            Ok(if matches!(self, Self::Div) {
+                if dtype.is_float() {
+                    dtype
                 } else {
-                    ArithmeticKernel::wrapping_mod_scalar(arr_lhs, r)
+                    DataType::Float64
                 }
-            },
-            Self::FloorDiv => {
-                if swapped {
-                    ArithmeticKernel::wrapping_floor_div_scalar_lhs(r, arr_lhs)
-                } else {
-                    ArithmeticKernel::wrapping_floor_div_scalar(arr_lhs, r)
+            } else {
+                dtype
+            })
+        }
+
+        /// For operations that perform divisions on integers, sets the validity to NULL on rows where
+        /// the denominator is 0.
+        fn prepare_numeric_op_side_validities<T: PolarsNumericType>(
+            &self,
+            lhs: &mut PrimitiveArray<T::Native>,
+            rhs: &mut PrimitiveArray<T::Native>,
+            swapped: bool,
+        ) where
+            PrimitiveArray<T::Native>:
+                polars_compute::comparisons::TotalEqKernel<Scalar = T::Native>,
+            T::Native: Zero + IsFloat,
+        {
+            if !T::Native::is_float() {
+                match self {
+                    Self::Div | Self::Rem | Self::FloorDiv => {
+                        let target = if swapped { lhs } else { rhs };
+                        let ne_0 = target.tot_ne_kernel_broadcast(&T::Native::zero());
+                        let validity = combine_validities_and(target.validity(), Some(&ne_0));
+                        target.set_validity(validity);
+                    },
+                    _ => {},
                 }
-            },
+            }
+        }
+
+        /// For list<->primitive where the primitive is broadcasted, we can dispatch to
+        /// `ArithmeticKernel`, which can have optimized codepaths for when one side is
+        /// a scalar.
+        fn apply_array_to_scalar<T: PolarsNumericType>(
+            &self,
+            arr_lhs: PrimitiveArray<T::Native>,
+            r: T::Native,
+            swapped: bool,
+        ) -> PrimitiveArray<T::Native> {
+            match self {
+                Self::Add => ArithmeticKernel::wrapping_add_scalar(arr_lhs, r),
+                Self::Sub => {
+                    if swapped {
+                        ArithmeticKernel::wrapping_sub_scalar_lhs(r, arr_lhs)
+                    } else {
+                        ArithmeticKernel::wrapping_sub_scalar(arr_lhs, r)
+                    }
+                },
+                Self::Mul => ArithmeticKernel::wrapping_mul_scalar(arr_lhs, r),
+                Self::Div => {
+                    if swapped {
+                        ArithmeticKernel::legacy_div_scalar_lhs(r, arr_lhs)
+                    } else {
+                        ArithmeticKernel::legacy_div_scalar(arr_lhs, r)
+                    }
+                },
+                Self::Rem => {
+                    if swapped {
+                        ArithmeticKernel::wrapping_mod_scalar_lhs(r, arr_lhs)
+                    } else {
+                        ArithmeticKernel::wrapping_mod_scalar(arr_lhs, r)
+                    }
+                },
+                Self::FloorDiv => {
+                    if swapped {
+                        ArithmeticKernel::wrapping_floor_div_scalar_lhs(r, arr_lhs)
+                    } else {
+                        ArithmeticKernel::wrapping_floor_div_scalar(arr_lhs, r)
+                    }
+                },
+            }
         }
     }
-}
 
-macro_rules! with_match_numeric_list_op {
+    macro_rules! with_match_numeric_list_op {
     ($op:expr, $swapped:expr, | $_:tt $OP:tt | $($body:tt)* ) => ({
         macro_rules! __with_func__ {( $_ $OP:tt ) => ( $($body)* )}
 
@@ -213,814 +231,826 @@ macro_rules! with_match_numeric_list_op {
     })
 }
 
-#[derive(Debug)]
-enum BinaryOpApplyType {
-    ListToList,
-    ListToPrimitive,
-    PrimitiveToList,
-}
-
-#[derive(Debug)]
-enum Broadcast {
-    Left,
-    Right,
-    #[allow(clippy::enum_variant_names)]
-    NoBroadcast,
-}
+    #[derive(Debug)]
+    enum BinaryOpApplyType {
+        ListToList,
+        ListToPrimitive,
+        PrimitiveToList,
+    }
 
-/// Utility to perform a binary operation between the primitive values of
-/// 2 columns, where at least one of the columns is a `ListChunked` type.
-struct BinaryListNumericOpHelper {
-    op: NumericListOp,
-    output_name: PlSmallStr,
-    op_apply_type: BinaryOpApplyType,
-    broadcast: Broadcast,
-    output_dtype: DataType,
-    output_primitive_dtype: DataType,
-    output_len: usize,
-    /// Outer validity of the result, we always materialize this to reduce the
-    /// amount of code paths we need.
-    outer_validity: Bitmap,
-    // The series are stored as they are used for list broadcasting.
-    data_lhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
-    data_rhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
-    list_to_prim_lhs: Option<(Box<dyn Array>, usize)>,
-    swapped: bool,
-}
+    #[derive(Debug)]
+    enum Broadcast {
+        Left,
+        Right,
+        #[allow(clippy::enum_variant_names)]
+        NoBroadcast,
+    }
 
-/// This lets us separate some logic into `new()` to reduce the amount of
-/// monomorphized code.
-impl BinaryListNumericOpHelper {
-    /// Checks that:
-    /// * Dtypes are compatible:
-    ///   * list<->primitive | primitive<->list
-    ///   * list<->list both contain primitives (e.g. List<Int8>)
-    /// * Primitive dtypes match
-    /// * Lengths are compatible:
-    ///   * 1<->n | n<->1
-    ///   * n<->n
-    /// * Both sides have at least 1 non-NULL outer row.
-    ///
-    /// Does not check:
-    /// * Whether the offsets are aligned for list<->list, this will be checked during execution.
-    ///
-    /// This returns an `Either` which may contain the final result to simplify
-    /// the implementation.
-    #[allow(clippy::too_many_arguments)]
-    fn try_new(
+    /// Utility to perform a binary operation between the primitive values of
+    /// 2 columns, where at least one of the columns is a `ListChunked` type.
+    pub(super) struct BinaryListNumericOpHelper {
         op: NumericListOp,
         output_name: PlSmallStr,
-        dtype_lhs: &DataType,
-        dtype_rhs: &DataType,
-        len_lhs: usize,
-        len_rhs: usize,
+        op_apply_type: BinaryOpApplyType,
+        broadcast: Broadcast,
+        output_dtype: DataType,
+        output_primitive_dtype: DataType,
+        output_len: usize,
+        /// Outer validity of the result, we always materialize this to reduce the
+        /// amount of code paths we need.
+        outer_validity: Bitmap,
+        // The series are stored as they are used for list broadcasting.
         data_lhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
         data_rhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
-        validity_lhs: Option<Bitmap>,
-        validity_rhs: Option<Bitmap>,
-    ) -> PolarsResult<Either<Self, ListChunked>> {
-        let prim_dtype_lhs = dtype_lhs.leaf_dtype();
-        let prim_dtype_rhs = dtype_rhs.leaf_dtype();
-
-        let output_primitive_dtype = op.try_get_leaf_supertype(prim_dtype_lhs, prim_dtype_rhs)?;
-
-        let (op_apply_type, output_dtype) = match (dtype_lhs, dtype_rhs) {
-            (l @ DataType::List(a), r @ DataType::List(b)) => {
-                // `get_arithmetic_field()` in the DSL checks this, but we also have to check here because if a user
-                // directly adds 2 series together it bypasses the DSL.
-                // This is currently duplicated code and should be replaced one day with an assert after Series ops get
-                // checked properly.
-                if ![a, b]
-                    .into_iter()
-                    .all(|x| x.is_numeric() || x.is_bool() || x.is_null())
+        list_to_prim_lhs: Option<(Box<dyn Array>, usize)>,
+        swapped: bool,
+    }
+
+    /// This lets us separate some logic into `new()` to reduce the amount of
+    /// monomorphized code.
+    impl BinaryListNumericOpHelper {
+        /// Checks that:
+        /// * Dtypes are compatible:
+        ///   * list<->primitive | primitive<->list
+        ///   * list<->list both contain primitives (e.g. List<Int8>)
+        /// * Primitive dtypes match
+        /// * Lengths are compatible:
+        ///   * 1<->n | n<->1
+        ///   * n<->n
+        /// * Both sides have at least 1 non-NULL outer row.
+        ///
+        /// Does not check:
+        /// * Whether the offsets are aligned for list<->list, this will be checked during execution.
+        ///
+        /// This returns an `Either` which may contain the final result to simplify
+        /// the implementation.
+        #[allow(clippy::too_many_arguments)]
+        pub(super) fn try_new(
+            op: NumericListOp,
+            output_name: PlSmallStr,
+            dtype_lhs: &DataType,
+            dtype_rhs: &DataType,
+            len_lhs: usize,
+            len_rhs: usize,
+            data_lhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
+            data_rhs: (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
+            validity_lhs: Option<Bitmap>,
+            validity_rhs: Option<Bitmap>,
+        ) -> PolarsResult<Either<Self, ListChunked>> {
+            let prim_dtype_lhs = dtype_lhs.leaf_dtype();
+            let prim_dtype_rhs = dtype_rhs.leaf_dtype();
+
+            let output_primitive_dtype =
+                op.try_get_leaf_supertype(prim_dtype_lhs, prim_dtype_rhs)?;
+
+            let (op_apply_type, output_dtype) = match (dtype_lhs, dtype_rhs) {
+                (l @ DataType::List(a), r @ DataType::List(b)) => {
+                    // `get_arithmetic_field()` in the DSL checks this, but we also have to check here because if a user
+                    // directly adds 2 series together it bypasses the DSL.
+                    // This is currently duplicated code and should be replaced one day with an assert after Series ops get
+                    // checked properly.
+                    if ![a, b]
+                        .into_iter()
+                        .all(|x| x.is_numeric() || x.is_bool() || x.is_null())
+                    {
+                        polars_bail!(
+                            InvalidOperation:
+                            "cannot {} two list columns with non-numeric inner types: (left: {}, right: {})",
+                            op.name(), l, r,
+                        );
+                    }
+                    (BinaryOpApplyType::ListToList, l)
+                },
+                (list_dtype @ DataType::List(_), x)
+                    if x.is_numeric() || x.is_bool() || x.is_null() =>
                 {
-                    polars_bail!(
-                        InvalidOperation:
-                        "cannot {} two list columns with non-numeric inner types: (left: {}, right: {})",
-                        op.name(), l, r,
-                    );
-                }
-                (BinaryOpApplyType::ListToList, l)
-            },
-            (list_dtype @ DataType::List(_), x) if x.is_numeric() || x.is_bool() || x.is_null() => {
-                (BinaryOpApplyType::ListToPrimitive, list_dtype)
-            },
-            (x, list_dtype @ DataType::List(_)) if x.is_numeric() || x.is_bool() || x.is_null() => {
-                (BinaryOpApplyType::PrimitiveToList, list_dtype)
-            },
-            (l, r) => polars_bail!(
-                InvalidOperation:
-                "{} operation not supported for dtypes: {} != {}",
-                op.name(), l, r,
-            ),
-        };
-
-        let output_dtype = output_dtype.cast_leaf(output_primitive_dtype.clone());
-
-        let (broadcast, output_len) = match (len_lhs, len_rhs) {
-            (l, r) if l == r => (Broadcast::NoBroadcast, l),
-            (1, v) => (Broadcast::Left, v),
-            (v, 1) => (Broadcast::Right, v),
-            (l, r) => polars_bail!(
-                ShapeMismatch:
-                "cannot {} two columns of differing lengths: {} != {}",
-                op.name(), l, r
-            ),
-        };
-
-        let DataType::List(output_inner_dtype) = &output_dtype else {
-            unreachable!()
-        };
-
-        // # NULL semantics
-        // * [[1, 2]] (List[List[Int64]]) + NULL (Int64) => [[NULL, NULL]]
-        //   * Essentially as if the NULL primitive was added to every primitive in the row of the list column.
-        // * NULL (List[Int64]) + 1   (Int64)       => NULL
-        // * NULL (List[Int64]) + [1] (List[Int64]) => NULL
-
-        if output_len == 0
-            || (len_lhs == 1
-                && matches!(
-                    &op_apply_type,
-                    BinaryOpApplyType::ListToList | BinaryOpApplyType::ListToPrimitive
-                )
-                && validity_lhs.as_ref().map_or(false, |x| {
-                    !x.get_bit(0) // is not valid
-                }))
-            || (len_rhs == 1
-                && matches!(
-                    &op_apply_type,
-                    BinaryOpApplyType::ListToList | BinaryOpApplyType::PrimitiveToList
+                    (BinaryOpApplyType::ListToPrimitive, list_dtype)
+                },
+                (x, list_dtype @ DataType::List(_))
+                    if x.is_numeric() || x.is_bool() || x.is_null() =>
+                {
+                    (BinaryOpApplyType::PrimitiveToList, list_dtype)
+                },
+                (l, r) => polars_bail!(
+                    InvalidOperation:
+                    "{} operation not supported for dtypes: {} != {}",
+                    op.name(), l, r,
+                ),
+            };
+
+            let output_dtype = output_dtype.cast_leaf(output_primitive_dtype.clone());
+
+            let (broadcast, output_len) = match (len_lhs, len_rhs) {
+                (l, r) if l == r => (Broadcast::NoBroadcast, l),
+                (1, v) => (Broadcast::Left, v),
+                (v, 1) => (Broadcast::Right, v),
+                (l, r) => polars_bail!(
+                    ShapeMismatch:
+                    "cannot {} two columns of differing lengths: {} != {}",
+                    op.name(), l, r
+                ),
+            };
+
+            let DataType::List(output_inner_dtype) = &output_dtype else {
+                unreachable!()
+            };
+
+            // # NULL semantics
+            // * [[1, 2]] (List[List[Int64]]) + NULL (Int64) => [[NULL, NULL]]
+            //   * Essentially as if the NULL primitive was added to every primitive in the row of the list column.
+            // * NULL (List[Int64]) + 1   (Int64)       => NULL
+            // * NULL (List[Int64]) + [1] (List[Int64]) => NULL
+
+            if output_len == 0
+                || (len_lhs == 1
+                    && matches!(
+                        &op_apply_type,
+                        BinaryOpApplyType::ListToList | BinaryOpApplyType::ListToPrimitive
+                    )
+                    && validity_lhs.as_ref().map_or(false, |x| {
+                        !x.get_bit(0) // is not valid
+                    }))
+                || (len_rhs == 1
+                    && matches!(
+                        &op_apply_type,
+                        BinaryOpApplyType::ListToList | BinaryOpApplyType::PrimitiveToList
+                    )
+                    && validity_rhs.as_ref().map_or(false, |x| {
+                        !x.get_bit(0) // is not valid
+                    }))
+            {
+                return Ok(Either::Right(ListChunked::full_null_with_dtype(
+                    output_name.clone(),
+                    output_len,
+                    output_inner_dtype.as_ref(),
+                )));
+            }
+
+            // At this point:
+            // * All unit length list columns have a valid outer value.
+
+            // The outer validity is just the validity of any non-broadcasting lists.
+            let outer_validity = match (&op_apply_type, &broadcast, validity_lhs, validity_rhs) {
+                // Both lists with same length, we combine the validity.
+                (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast, l, r) => {
+                    combine_validities_and(l.as_ref(), r.as_ref())
+                },
+                // Match all other combinations that have non-broadcasting lists.
+                (
+                    BinaryOpApplyType::ListToList | BinaryOpApplyType::ListToPrimitive,
+                    Broadcast::NoBroadcast | Broadcast::Right,
+                    v,
+                    _,
                 )
-                && validity_rhs.as_ref().map_or(false, |x| {
-                    !x.get_bit(0) // is not valid
-                }))
-        {
-            return Ok(Either::Right(ListChunked::full_null_with_dtype(
-                output_name.clone(),
+                | (
+                    BinaryOpApplyType::ListToList | BinaryOpApplyType::PrimitiveToList,
+                    Broadcast::NoBroadcast | Broadcast::Left,
+                    _,
+                    v,
+                ) => v,
+                _ => None,
+            }
+            .unwrap_or_else(|| Bitmap::new_with_value(true, output_len));
+
+            Ok(Either::Left(Self {
+                op,
+                output_name,
+                op_apply_type,
+                broadcast,
+                output_dtype: output_dtype.clone(),
+                output_primitive_dtype,
                 output_len,
-                output_inner_dtype.as_ref(),
-            )));
+                outer_validity,
+                data_lhs,
+                data_rhs,
+                list_to_prim_lhs: None,
+                swapped: false,
+            }))
         }
 
-        // At this point:
-        // * All unit length list columns have a valid outer value.
-
-        // The outer validity is just the validity of any non-broadcasting lists.
-        let outer_validity = match (&op_apply_type, &broadcast, validity_lhs, validity_rhs) {
-            // Both lists with same length, we combine the validity.
-            (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast, l, r) => {
-                combine_validities_and(l.as_ref(), r.as_ref())
-            },
-            // Match all other combinations that have non-broadcasting lists.
-            (
-                BinaryOpApplyType::ListToList | BinaryOpApplyType::ListToPrimitive,
-                Broadcast::NoBroadcast | Broadcast::Right,
-                v,
-                _,
-            )
-            | (
-                BinaryOpApplyType::ListToList | BinaryOpApplyType::PrimitiveToList,
-                Broadcast::NoBroadcast | Broadcast::Left,
-                _,
-                v,
-            ) => v,
-            _ => None,
-        }
-        .unwrap_or_else(|| Bitmap::new_with_value(true, output_len));
-
-        Ok(Either::Left(Self {
-            op,
-            output_name,
-            op_apply_type,
-            broadcast,
-            output_dtype: output_dtype.clone(),
-            output_primitive_dtype,
-            output_len,
-            outer_validity,
-            data_lhs,
-            data_rhs,
-            list_to_prim_lhs: None,
-            swapped: false,
-        }))
-    }
+        pub(super) fn finish(mut self) -> PolarsResult<ListChunked> {
+            // We have physical codepaths for a subset of the possible combinations of broadcasting and
+            // column types. The remaining combinations are handled by dispatching to the physical
+            // codepaths after operand swapping and/or materialized broadcasting.
+            //
+            // # Physical impl table
+            // Legend
+            // * |  N  | // impl "N"
+            // * | [N] | // dispatches to impl "N"
+            //
+            //                  |  L  |  N  |  R  | // Broadcast (L)eft, (N)oBroadcast, (R)ight
+            // ListToList       | [1] |  0  |  1  |
+            // ListToPrimitive  | [2] |  2  |  3  | // list broadcasting just materializes and dispatches to NoBroadcast
+            // PrimitiveToList  | [3] | [2] | [2] |
+
+            self.swapped = true;
+
+            match (&self.op_apply_type, &self.broadcast) {
+                (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast)
+                | (BinaryOpApplyType::ListToList, Broadcast::Right)
+                | (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast)
+                | (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {
+                    self.swapped = false;
+                    self._finish_impl_dispatch()
+                },
+                (BinaryOpApplyType::PrimitiveToList, Broadcast::Right) => {
+                    // We materialize the list columns with `new_from_index`, as otherwise we'd have to
+                    // implement logic that broadcasts the offsets and validities across multiple levels
+                    // of nesting. But we will re-use the materialized memory to store the result.
+
+                    self.list_to_prim_lhs
+                        .replace(Self::materialize_broadcasted_list(
+                            &mut self.data_rhs,
+                            self.output_len,
+                            &self.output_primitive_dtype,
+                        ));
+
+                    self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
+                    self.broadcast = Broadcast::NoBroadcast;
+                    core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
+
+                    self._finish_impl_dispatch()
+                },
+                (BinaryOpApplyType::ListToList, Broadcast::Left) => {
+                    self.broadcast = Broadcast::Right;
 
-    fn finish(mut self) -> PolarsResult<ListChunked> {
-        // We have physical codepaths for a subset of the possible combinations of broadcasting and
-        // column types. The remaining combinations are handled by dispatching to the physical
-        // codepaths after operand swapping and/or materialized broadcasting.
-        //
-        // # Physical impl table
-        // Legend
-        // * |  N  | // impl "N"
-        // * | [N] | // dispatches to impl "N"
-        //
-        //                  |  L  |  N  |  R  | // Broadcast (L)eft, (N)oBroadcast, (R)ight
-        // ListToList       | [1] |  0  |  1  |
-        // ListToPrimitive  | [2] |  2  |  3  | // list broadcasting just materializes and dispatches to NoBroadcast
-        // PrimitiveToList  | [3] | [2] | [2] |
-
-        self.swapped = true;
-
-        match (&self.op_apply_type, &self.broadcast) {
-            (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast)
-            | (BinaryOpApplyType::ListToList, Broadcast::Right)
-            | (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast)
-            | (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {
-                self.swapped = false;
-                self._finish_impl_dispatch()
-            },
-            (BinaryOpApplyType::PrimitiveToList, Broadcast::Right) => {
-                // We materialize the list columns with `new_from_index`, as otherwise we'd have to
-                // implement logic that broadcasts the offsets and validities across multiple levels
-                // of nesting. But we will re-use the materialized memory to store the result.
-
-                self.list_to_prim_lhs
-                    .replace(Self::materialize_broadcasted_list(
-                        &mut self.data_rhs,
-                        self.output_len,
-                        &self.output_primitive_dtype,
-                    ));
-
-                self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
-                self.broadcast = Broadcast::NoBroadcast;
-                core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
-
-                self._finish_impl_dispatch()
-            },
-            (BinaryOpApplyType::ListToList, Broadcast::Left) => {
-                self.broadcast = Broadcast::Right;
+                    core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
 
-                core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
+                    self._finish_impl_dispatch()
+                },
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::Left) => {
+                    self.list_to_prim_lhs
+                        .replace(Self::materialize_broadcasted_list(
+                            &mut self.data_lhs,
+                            self.output_len,
+                            &self.output_primitive_dtype,
+                        ));
+
+                    self.broadcast = Broadcast::NoBroadcast;
+
+                    // This does not swap! We are just dispatching to `NoBroadcast`
+                    // after materializing the broadcasted list array.
+                    self.swapped = false;
+                    self._finish_impl_dispatch()
+                },
+                (BinaryOpApplyType::PrimitiveToList, Broadcast::Left) => {
+                    self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
+                    self.broadcast = Broadcast::Right;
 
-                self._finish_impl_dispatch()
-            },
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::Left) => {
-                self.list_to_prim_lhs
-                    .replace(Self::materialize_broadcasted_list(
-                        &mut self.data_lhs,
-                        self.output_len,
-                        &self.output_primitive_dtype,
-                    ));
-
-                self.broadcast = Broadcast::NoBroadcast;
-
-                // This does not swap! We are just dispatching to `NoBroadcast`
-                // after materializing the broadcasted list array.
-                self.swapped = false;
-                self._finish_impl_dispatch()
-            },
-            (BinaryOpApplyType::PrimitiveToList, Broadcast::Left) => {
-                self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
-                self.broadcast = Broadcast::Right;
+                    core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
 
-                core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
+                    self._finish_impl_dispatch()
+                },
+                (BinaryOpApplyType::PrimitiveToList, Broadcast::NoBroadcast) => {
+                    self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
 
-                self._finish_impl_dispatch()
-            },
-            (BinaryOpApplyType::PrimitiveToList, Broadcast::NoBroadcast) => {
-                self.op_apply_type = BinaryOpApplyType::ListToPrimitive;
+                    core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
 
-                core::mem::swap(&mut self.data_lhs, &mut self.data_rhs);
+                    self._finish_impl_dispatch()
+                },
+            }
+        }
 
-                self._finish_impl_dispatch()
-            },
+        fn _finish_impl_dispatch(&mut self) -> PolarsResult<ListChunked> {
+            let output_dtype = self.output_dtype.clone();
+            let output_len = self.output_len;
+
+            let prim_lhs = self
+                .data_lhs
+                .2
+                .get_leaf_array()
+                .cast(&self.output_primitive_dtype)?
+                .rechunk();
+            let prim_rhs = self
+                .data_rhs
+                .2
+                .get_leaf_array()
+                .cast(&self.output_primitive_dtype)?
+                .rechunk();
+
+            debug_assert_eq!(prim_lhs.dtype(), prim_rhs.dtype());
+            let prim_dtype = prim_lhs.dtype();
+            debug_assert_eq!(prim_dtype, &self.output_primitive_dtype);
+
+            // Safety: Leaf dtypes have been checked to be numeric by `try_new()`
+            let out = with_match_physical_numeric_polars_type!(&prim_dtype, |$T| {
+                self._finish_impl::<$T>(prim_lhs, prim_rhs)
+            })?;
+
+            debug_assert_eq!(out.dtype(), &output_dtype);
+            assert_eq!(out.len(), output_len);
+
+            Ok(out)
         }
-    }
 
-    fn _finish_impl_dispatch(&mut self) -> PolarsResult<ListChunked> {
-        let output_dtype = self.output_dtype.clone();
-        let output_len = self.output_len;
-
-        let prim_lhs = self
-            .data_lhs
-            .2
-            .get_leaf_array()
-            .cast(&self.output_primitive_dtype)?
-            .rechunk();
-        let prim_rhs = self
-            .data_rhs
-            .2
-            .get_leaf_array()
-            .cast(&self.output_primitive_dtype)?
-            .rechunk();
-
-        debug_assert_eq!(prim_lhs.dtype(), prim_rhs.dtype());
-        let prim_dtype = prim_lhs.dtype();
-        debug_assert_eq!(prim_dtype, &self.output_primitive_dtype);
-
-        // Safety: Leaf dtypes have been checked to be numeric by `try_new()`
-        let out = with_match_physical_numeric_polars_type!(&prim_dtype, |$T| {
-            self._finish_impl::<$T>(prim_lhs, prim_rhs)
-        })?;
-
-        debug_assert_eq!(out.dtype(), &output_dtype);
-        assert_eq!(out.len(), output_len);
-
-        Ok(out)
-    }
+        /// Internal use only - contains physical impls.
+        fn _finish_impl<T: PolarsNumericType>(
+            &mut self,
+            prim_s_lhs: Series,
+            prim_s_rhs: Series,
+        ) -> PolarsResult<ListChunked>
+        where
+            T::Native: PlNumArithmetic,
+            PrimitiveArray<T::Native>:
+                polars_compute::comparisons::TotalEqKernel<Scalar = T::Native>,
+            T::Native: Zero + IsFloat,
+        {
+            #[inline(never)]
+            fn check_mismatch_pos(
+                mismatch_pos: usize,
+                offsets_lhs: &OffsetsBuffer<i64>,
+                offsets_rhs: &OffsetsBuffer<i64>,
+            ) -> PolarsResult<()> {
+                if mismatch_pos < offsets_lhs.len_proxy() {
+                    // RHS could be broadcasted
+                    let len_r = offsets_rhs.length_at(if offsets_rhs.len_proxy() == 1 {
+                        0
+                    } else {
+                        mismatch_pos
+                    });
+                    polars_bail!(
+                        ShapeMismatch:
+                        "list lengths differed at index {}: {} != {}",
+                        mismatch_pos,
+                        offsets_lhs.length_at(mismatch_pos), len_r
+                    )
+                }
+                Ok(())
+            }
 
-    /// Internal use only - contains physical impls.
-    fn _finish_impl<T: PolarsNumericType>(
-        &mut self,
-        prim_s_lhs: Series,
-        prim_s_rhs: Series,
-    ) -> PolarsResult<ListChunked>
-    where
-        T::Native: PlNumArithmetic,
-        PrimitiveArray<T::Native>: polars_compute::comparisons::TotalEqKernel<Scalar = T::Native>,
-        T::Native: Zero + IsFloat,
-    {
-        #[inline(never)]
-        fn check_mismatch_pos(
-            mismatch_pos: usize,
-            offsets_lhs: &OffsetsBuffer<i64>,
-            offsets_rhs: &OffsetsBuffer<i64>,
-        ) -> PolarsResult<()> {
-            if mismatch_pos < offsets_lhs.len_proxy() {
-                // RHS could be broadcasted
-                let len_r = offsets_rhs.length_at(if offsets_rhs.len_proxy() == 1 {
-                    0
-                } else {
-                    mismatch_pos
-                });
-                polars_bail!(
-                    ShapeMismatch:
-                    "list lengths differed at index {}: {} != {}",
-                    mismatch_pos,
-                    offsets_lhs.length_at(mismatch_pos), len_r
-                )
+            let mut arr_lhs = {
+                let ca: &ChunkedArray<T> = prim_s_lhs.as_ref().as_ref();
+                assert_eq!(ca.chunks().len(), 1);
+                ca.downcast_get(0).unwrap().clone()
+            };
+
+            let mut arr_rhs = {
+                let ca: &ChunkedArray<T> = prim_s_rhs.as_ref().as_ref();
+                assert_eq!(ca.chunks().len(), 1);
+                ca.downcast_get(0).unwrap().clone()
+            };
+
+            match (&self.op_apply_type, &self.broadcast) {
+                // We skip for this because it dispatches to `ArithmeticKernel`, which handles the
+                // validities for us.
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {},
+                _ if self.list_to_prim_lhs.is_none() => {
+                    self.op.prepare_numeric_op_side_validities::<T>(
+                        &mut arr_lhs,
+                        &mut arr_rhs,
+                        self.swapped,
+                    )
+                },
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast) => {},
+                _ => unreachable!(),
             }
-            Ok(())
-        }
 
-        let mut arr_lhs = {
-            let ca: &ChunkedArray<T> = prim_s_lhs.as_ref().as_ref();
-            assert_eq!(ca.chunks().len(), 1);
-            ca.downcast_get(0).unwrap().clone()
-        };
-
-        let mut arr_rhs = {
-            let ca: &ChunkedArray<T> = prim_s_rhs.as_ref().as_ref();
-            assert_eq!(ca.chunks().len(), 1);
-            ca.downcast_get(0).unwrap().clone()
-        };
-
-        match (&self.op_apply_type, &self.broadcast) {
-            // We skip for this because it dispatches to `ArithmeticKernel`, which handles the
-            // validities for us.
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {},
-            _ if self.list_to_prim_lhs.is_none() => self
-                .op
-                .prepare_numeric_op_side_validities::<T>(&mut arr_lhs, &mut arr_rhs, self.swapped),
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast) => {},
-            _ => unreachable!(),
-        }
+            //
+            // General notes
+            // * Lists can be:
+            //   * Sliced, in which case the primitive/leaf array needs to be indexed starting from an
+            //     offset instead of 0.
+            //   * Masked, in which case the masked rows are permitted to have non-matching widths.
+            //
 
-        //
-        // General notes
-        // * Lists can be:
-        //   * Sliced, in which case the primitive/leaf array needs to be indexed starting from an
-        //     offset instead of 0.
-        //   * Masked, in which case the masked rows are permitted to have non-matching widths.
-        //
-
-        let out = match (&self.op_apply_type, &self.broadcast) {
-            (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast) => {
-                let offsets_lhs = &self.data_lhs.0[0];
-                let offsets_rhs = &self.data_rhs.0[0];
-
-                assert_eq!(offsets_lhs.len_proxy(), offsets_rhs.len_proxy());
-
-                // Output primitive (and optional validity) are aligned to the LHS input.
-                let n_values = arr_lhs.len();
-                let mut out_vec: Vec<T::Native> = Vec::with_capacity(n_values);
-                let out_ptr: *mut T::Native = out_vec.as_mut_ptr();
-
-                // Counter that stops being incremented at the first row position with mismatching
-                // list lengths.
-                let mut mismatch_pos = 0;
-
-                with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
-                    for (i, ((lhs_start, lhs_len), (rhs_start, rhs_len))) in offsets_lhs
-                        .offset_and_length_iter()
-                        .zip(offsets_rhs.offset_and_length_iter())
-                        .enumerate()
-                    {
-                        if
-                            (mismatch_pos == i)
-                            & (
-                                (lhs_len == rhs_len)
-                                | unsafe { !self.outer_validity.get_bit_unchecked(i) }
-                            )
-                        {
-                            mismatch_pos += 1;
-                        }
+            let out = match (&self.op_apply_type, &self.broadcast) {
+                (BinaryOpApplyType::ListToList, Broadcast::NoBroadcast) => {
+                    let offsets_lhs = &self.data_lhs.0[0];
+                    let offsets_rhs = &self.data_rhs.0[0];
 
-                        // Both sides are lists, we restrict the index to the min length to avoid
-                        // OOB memory access.
-                        let len: usize = lhs_len.min(rhs_len);
+                    assert_eq!(offsets_lhs.len_proxy(), offsets_rhs.len_proxy());
 
-                        for i in 0..len {
-                            let l_idx = i + lhs_start;
-                            let r_idx = i + rhs_start;
+                    // Output primitive (and optional validity) are aligned to the LHS input.
+                    let n_values = arr_lhs.len();
+                    let mut out_vec: Vec<T::Native> = Vec::with_capacity(n_values);
+                    let out_ptr: *mut T::Native = out_vec.as_mut_ptr();
 
-                            let l = unsafe { arr_lhs.value_unchecked(l_idx) };
-                            let r = unsafe { arr_rhs.value_unchecked(r_idx) };
-                            let v = $OP(l, r);
+                    // Counter that stops being incremented at the first row position with mismatching
+                    // list lengths.
+                    let mut mismatch_pos = 0;
 
-                            unsafe { out_ptr.add(l_idx).write(v) };
-                        }
-                    }
-                });
-
-                check_mismatch_pos(mismatch_pos, offsets_lhs, offsets_rhs)?;
-
-                unsafe { out_vec.set_len(n_values) };
-
-                /// Reduce monomorphization
-                #[inline(never)]
-                fn combine_validities_list_to_list_no_broadcast(
-                    offsets_lhs: &OffsetsBuffer<i64>,
-                    offsets_rhs: &OffsetsBuffer<i64>,
-                    validity_lhs: Option<&Bitmap>,
-                    validity_rhs: Option<&Bitmap>,
-                    len_lhs: usize,
-                ) -> Option<Bitmap> {
-                    match (validity_lhs, validity_rhs) {
-                        (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
-                        (Some(v), None) => return Some(v.clone()),
-                        (None, Some(v)) => {
-                            Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v))
-                        },
-                        (None, None) => None,
-                    }
-                    .map(|(mut validity_out, validity_rhs)| {
-                        for ((lhs_start, lhs_len), (rhs_start, rhs_len)) in offsets_lhs
+                    with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
+                        for (i, ((lhs_start, lhs_len), (rhs_start, rhs_len))) in offsets_lhs
                             .offset_and_length_iter()
                             .zip(offsets_rhs.offset_and_length_iter())
+                            .enumerate()
                         {
+                            if
+                                (mismatch_pos == i)
+                                & (
+                                    (lhs_len == rhs_len)
+                                    | unsafe { !self.outer_validity.get_bit_unchecked(i) }
+                                )
+                            {
+                                mismatch_pos += 1;
+                            }
+
+                            // Both sides are lists, we restrict the index to the min length to avoid
+                            // OOB memory access.
                             let len: usize = lhs_len.min(rhs_len);
 
                             for i in 0..len {
                                 let l_idx = i + lhs_start;
                                 let r_idx = i + rhs_start;
 
-                                let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
-                                let r_valid = unsafe { validity_rhs.get_bit_unchecked(r_idx) };
-                                let is_valid = l_valid & r_valid;
+                                let l = unsafe { arr_lhs.value_unchecked(l_idx) };
+                                let r = unsafe { arr_rhs.value_unchecked(r_idx) };
+                                let v = $OP(l, r);
 
-                                // Size and alignment of validity vec are based on LHS.
-                                unsafe { validity_out.set_unchecked(l_idx, is_valid) };
+                                unsafe { out_ptr.add(l_idx).write(v) };
                             }
                         }
+                    });
+
+                    check_mismatch_pos(mismatch_pos, offsets_lhs, offsets_rhs)?;
+
+                    unsafe { out_vec.set_len(n_values) };
+
+                    /// Reduce monomorphization
+                    #[inline(never)]
+                    fn combine_validities_list_to_list_no_broadcast(
+                        offsets_lhs: &OffsetsBuffer<i64>,
+                        offsets_rhs: &OffsetsBuffer<i64>,
+                        validity_lhs: Option<&Bitmap>,
+                        validity_rhs: Option<&Bitmap>,
+                        len_lhs: usize,
+                    ) -> Option<Bitmap> {
+                        match (validity_lhs, validity_rhs) {
+                            (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
+                            (Some(v), None) => return Some(v.clone()),
+                            (None, Some(v)) => {
+                                Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v))
+                            },
+                            (None, None) => None,
+                        }
+                        .map(|(mut validity_out, validity_rhs)| {
+                            for ((lhs_start, lhs_len), (rhs_start, rhs_len)) in offsets_lhs
+                                .offset_and_length_iter()
+                                .zip(offsets_rhs.offset_and_length_iter())
+                            {
+                                let len: usize = lhs_len.min(rhs_len);
+
+                                for i in 0..len {
+                                    let l_idx = i + lhs_start;
+                                    let r_idx = i + rhs_start;
+
+                                    let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
+                                    let r_valid = unsafe { validity_rhs.get_bit_unchecked(r_idx) };
+                                    let is_valid = l_valid & r_valid;
+
+                                    // Size and alignment of validity vec are based on LHS.
+                                    unsafe { validity_out.set_unchecked(l_idx, is_valid) };
+                                }
+                            }
 
-                        validity_out.freeze()
-                    })
-                }
-
-                let leaf_validity = combine_validities_list_to_list_no_broadcast(
-                    offsets_lhs,
-                    offsets_rhs,
-                    arr_lhs.validity(),
-                    arr_rhs.validity(),
-                    arr_lhs.len(),
-                );
-
-                let arr =
-                    PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
-
-                let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
-                assert_eq!(offsets.len(), 1);
-
-                self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
-            },
-            (BinaryOpApplyType::ListToList, Broadcast::Right) => {
-                let offsets_lhs = &self.data_lhs.0[0];
-                let offsets_rhs = &self.data_rhs.0[0];
+                            validity_out.freeze()
+                        })
+                    }
 
-                // Output primitive (and optional validity) are aligned to the LHS input.
-                let n_values = arr_lhs.len();
-                let mut out_vec: Vec<T::Native> = Vec::with_capacity(n_values);
-                let out_ptr: *mut T::Native = out_vec.as_mut_ptr();
+                    let leaf_validity = combine_validities_list_to_list_no_broadcast(
+                        offsets_lhs,
+                        offsets_rhs,
+                        arr_lhs.validity(),
+                        arr_rhs.validity(),
+                        arr_lhs.len(),
+                    );
 
-                assert_eq!(offsets_rhs.len_proxy(), 1);
-                let rhs_start = *offsets_rhs.first() as usize;
-                let width = offsets_rhs.range() as usize;
+                    let arr =
+                        PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
 
-                let mut mismatch_pos = 0;
+                    let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+                    assert_eq!(offsets.len(), 1);
 
-                with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
-                    for (i, (lhs_start, lhs_len)) in offsets_lhs.offset_and_length_iter().enumerate() {
-                        if ((lhs_len == width) & (mismatch_pos == i))
-                            | unsafe { !self.outer_validity.get_bit_unchecked(i) }
-                        {
-                            mismatch_pos += 1;
-                        }
+                    self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
+                },
+                (BinaryOpApplyType::ListToList, Broadcast::Right) => {
+                    let offsets_lhs = &self.data_lhs.0[0];
+                    let offsets_rhs = &self.data_rhs.0[0];
 
-                        let len: usize = lhs_len.min(width);
+                    // Output primitive (and optional validity) are aligned to the LHS input.
+                    let n_values = arr_lhs.len();
+                    let mut out_vec: Vec<T::Native> = Vec::with_capacity(n_values);
+                    let out_ptr: *mut T::Native = out_vec.as_mut_ptr();
 
-                        for i in 0..len {
-                            let l_idx = i + lhs_start;
-                            let r_idx = i + rhs_start;
+                    assert_eq!(offsets_rhs.len_proxy(), 1);
+                    let rhs_start = *offsets_rhs.first() as usize;
+                    let width = offsets_rhs.range() as usize;
 
-                            let l = unsafe { arr_lhs.value_unchecked(l_idx) };
-                            let r = unsafe { arr_rhs.value_unchecked(r_idx) };
-                            let v = $OP(l, r);
+                    let mut mismatch_pos = 0;
 
-                            unsafe {
-                                out_ptr.add(l_idx).write(v);
+                    with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
+                        for (i, (lhs_start, lhs_len)) in offsets_lhs.offset_and_length_iter().enumerate() {
+                            if ((lhs_len == width) & (mismatch_pos == i))
+                                | unsafe { !self.outer_validity.get_bit_unchecked(i) }
+                            {
+                                mismatch_pos += 1;
                             }
-                        }
-                    }
-                });
-
-                check_mismatch_pos(mismatch_pos, offsets_lhs, offsets_rhs)?;
-
-                unsafe { out_vec.set_len(n_values) };
-
-                #[inline(never)]
-                fn combine_validities_list_to_list_broadcast_right(
-                    offsets_lhs: &OffsetsBuffer<i64>,
-                    validity_lhs: Option<&Bitmap>,
-                    validity_rhs: Option<&Bitmap>,
-                    len_lhs: usize,
-                    width: usize,
-                    rhs_start: usize,
-                ) -> Option<Bitmap> {
-                    match (validity_lhs, validity_rhs) {
-                        (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
-                        (Some(v), None) => return Some(v.clone()),
-                        (None, Some(v)) => {
-                            Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v))
-                        },
-                        (None, None) => None,
-                    }
-                    .map(|(mut validity_out, validity_rhs)| {
-                        for (lhs_start, lhs_len) in offsets_lhs.offset_and_length_iter() {
+
                             let len: usize = lhs_len.min(width);
 
                             for i in 0..len {
                                 let l_idx = i + lhs_start;
                                 let r_idx = i + rhs_start;
 
-                                let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
-                                let r_valid = unsafe { validity_rhs.get_bit_unchecked(r_idx) };
-                                let is_valid = l_valid & r_valid;
+                                let l = unsafe { arr_lhs.value_unchecked(l_idx) };
+                                let r = unsafe { arr_rhs.value_unchecked(r_idx) };
+                                let v = $OP(l, r);
 
-                                // Size and alignment of validity vec are based on LHS.
-                                unsafe { validity_out.set_unchecked(l_idx, is_valid) };
+                                unsafe {
+                                    out_ptr.add(l_idx).write(v);
+                                }
                             }
                         }
+                    });
+
+                    check_mismatch_pos(mismatch_pos, offsets_lhs, offsets_rhs)?;
+
+                    unsafe { out_vec.set_len(n_values) };
+
+                    #[inline(never)]
+                    fn combine_validities_list_to_list_broadcast_right(
+                        offsets_lhs: &OffsetsBuffer<i64>,
+                        validity_lhs: Option<&Bitmap>,
+                        validity_rhs: Option<&Bitmap>,
+                        len_lhs: usize,
+                        width: usize,
+                        rhs_start: usize,
+                    ) -> Option<Bitmap> {
+                        match (validity_lhs, validity_rhs) {
+                            (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
+                            (Some(v), None) => return Some(v.clone()),
+                            (None, Some(v)) => {
+                                Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v))
+                            },
+                            (None, None) => None,
+                        }
+                        .map(|(mut validity_out, validity_rhs)| {
+                            for (lhs_start, lhs_len) in offsets_lhs.offset_and_length_iter() {
+                                let len: usize = lhs_len.min(width);
 
-                        validity_out.freeze()
-                    })
-                }
-
-                let leaf_validity = combine_validities_list_to_list_broadcast_right(
-                    offsets_lhs,
-                    arr_lhs.validity(),
-                    arr_rhs.validity(),
-                    arr_lhs.len(),
-                    width,
-                    rhs_start,
-                );
+                                for i in 0..len {
+                                    let l_idx = i + lhs_start;
+                                    let r_idx = i + rhs_start;
 
-                let arr =
-                    PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
+                                    let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
+                                    let r_valid = unsafe { validity_rhs.get_bit_unchecked(r_idx) };
+                                    let is_valid = l_valid & r_valid;
 
-                let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
-                assert_eq!(offsets.len(), 1);
+                                    // Size and alignment of validity vec are based on LHS.
+                                    unsafe { validity_out.set_unchecked(l_idx, is_valid) };
+                                }
+                            }
 
-                self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
-            },
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast)
-                if self.list_to_prim_lhs.is_none() =>
-            {
-                let offsets_lhs = self.data_lhs.0.as_slice();
+                            validity_out.freeze()
+                        })
+                    }
 
-                // Notes
-                // * Primitive indexing starts from 0
-                // * Output is aligned to LHS array
+                    let leaf_validity = combine_validities_list_to_list_broadcast_right(
+                        offsets_lhs,
+                        arr_lhs.validity(),
+                        arr_rhs.validity(),
+                        arr_lhs.len(),
+                        width,
+                        rhs_start,
+                    );
 
-                let n_values = arr_lhs.len();
-                let mut out_vec = Vec::<T::Native>::with_capacity(n_values);
-                let out_ptr = out_vec.as_mut_ptr();
+                    let arr =
+                        PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
 
-                with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
-                    for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate()
-                    {
-                        let r = unsafe { arr_rhs.value_unchecked(i) };
-                        for l_idx in l_range {
-                            unsafe {
-                                let l = arr_lhs.value_unchecked(l_idx);
-                                let v = $OP(l, r);
-                                out_ptr.add(l_idx).write(v);
-                            }
-                        }
-                    }
-                });
+                    let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+                    assert_eq!(offsets.len(), 1);
 
-                unsafe { out_vec.set_len(n_values) }
+                    self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
+                },
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast)
+                    if self.list_to_prim_lhs.is_none() =>
+                {
+                    let offsets_lhs = self.data_lhs.0.as_slice();
 
-                let leaf_validity = combine_validities_list_to_primitive_no_broadcast(
-                    offsets_lhs,
-                    arr_lhs.validity(),
-                    arr_rhs.validity(),
-                    arr_lhs.len(),
-                );
+                    // Notes
+                    // * Primitive indexing starts from 0
+                    // * Output is aligned to LHS array
 
-                let arr =
-                    PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
+                    let n_values = arr_lhs.len();
+                    let mut out_vec = Vec::<T::Native>::with_capacity(n_values);
+                    let out_ptr = out_vec.as_mut_ptr();
 
-                let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
-                self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
-            },
-            // If we are dispatched here, it means that the LHS array is a unique allocation created
-            // after a unit-length list column was broadcasted, so this codepath mutably stores the
-            // results back into the LHS array to save memory.
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast) => {
-                let offsets_lhs = self.data_lhs.0.as_slice();
-
-                let (mut arr, n_values) = Option::take(&mut self.list_to_prim_lhs).unwrap();
-                let arr = arr
-                    .as_any_mut()
-                    .downcast_mut::<PrimitiveArray<T::Native>>()
-                    .unwrap();
-                let mut arr_lhs = core::mem::take(arr);
-
-                self.op.prepare_numeric_op_side_validities::<T>(
-                    &mut arr_lhs,
-                    &mut arr_rhs,
-                    self.swapped,
-                );
-
-                let arr_lhs_mut_slice = arr_lhs.get_mut_values().unwrap();
-                assert_eq!(arr_lhs_mut_slice.len(), n_values);
-
-                with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
-                    for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate()
-                    {
-                        let r = unsafe { arr_rhs.value_unchecked(i) };
-                        for l_idx in l_range {
-                            unsafe {
-                                let l = arr_lhs_mut_slice.get_unchecked_mut(l_idx);
-                                *l = $OP(*l, r);
+                    with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
+                        for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate()
+                        {
+                            let r = unsafe { arr_rhs.value_unchecked(i) };
+                            for l_idx in l_range {
+                                unsafe {
+                                    let l = arr_lhs.value_unchecked(l_idx);
+                                    let v = $OP(l, r);
+                                    out_ptr.add(l_idx).write(v);
+                                }
                             }
                         }
-                    }
-                });
+                    });
 
-                let leaf_validity = combine_validities_list_to_primitive_no_broadcast(
-                    offsets_lhs,
-                    arr_lhs.validity(),
-                    arr_rhs.validity(),
-                    arr_lhs.len(),
-                );
+                    unsafe { out_vec.set_len(n_values) }
 
-                let arr = arr_lhs.with_validity(leaf_validity);
+                    let leaf_validity = combine_validities_list_to_primitive_no_broadcast(
+                        offsets_lhs,
+                        arr_lhs.validity(),
+                        arr_rhs.validity(),
+                        arr_lhs.len(),
+                    );
 
-                let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
-                self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
-            },
-            (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {
-                assert_eq!(arr_rhs.len(), 1);
+                    let arr =
+                        PrimitiveArray::<T::Native>::from_vec(out_vec).with_validity(leaf_validity);
 
-                let Some(r) = (unsafe { arr_rhs.get_unchecked(0) }) else {
-                    // RHS is single primitive NULL, create the result by setting the leaf validity to all-NULL.
                     let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
-                    return self.finish_offsets_and_validities(
-                        Box::new(
-                            arr_lhs
-                                .clone()
-                                .with_validity(Some(Bitmap::new_with_value(false, arr_lhs.len()))),
-                        ),
-                        offsets,
-                        validities,
+                    self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
+                },
+                // If we are dispatched here, it means that the LHS array is a unique allocation created
+                // after a unit-length list column was broadcasted, so this codepath mutably stores the
+                // results back into the LHS array to save memory.
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::NoBroadcast) => {
+                    let offsets_lhs = self.data_lhs.0.as_slice();
+
+                    let (mut arr, n_values) = Option::take(&mut self.list_to_prim_lhs).unwrap();
+                    let arr = arr
+                        .as_any_mut()
+                        .downcast_mut::<PrimitiveArray<T::Native>>()
+                        .unwrap();
+                    let mut arr_lhs = core::mem::take(arr);
+
+                    self.op.prepare_numeric_op_side_validities::<T>(
+                        &mut arr_lhs,
+                        &mut arr_rhs,
+                        self.swapped,
                     );
-                };
 
-                let arr = self.op.apply_array_to_scalar::<T>(arr_lhs, r, self.swapped);
-                let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+                    let arr_lhs_mut_slice = arr_lhs.get_mut_values().unwrap();
+                    assert_eq!(arr_lhs_mut_slice.len(), n_values);
 
-                self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
-            },
-            v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::Right)
-            | v @ (BinaryOpApplyType::ListToList, Broadcast::Left)
-            | v @ (BinaryOpApplyType::ListToPrimitive, Broadcast::Left)
-            | v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::Left)
-            | v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::NoBroadcast) => {
-                if cfg!(debug_assertions) {
-                    panic!("operation was not re-written: {:?}", v)
-                } else {
-                    unreachable!()
-                }
-            },
-        }?;
+                    with_match_numeric_list_op!(&self.op, self.swapped, |$OP| {
+                        for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate()
+                        {
+                            let r = unsafe { arr_rhs.value_unchecked(i) };
+                            for l_idx in l_range {
+                                unsafe {
+                                    let l = arr_lhs_mut_slice.get_unchecked_mut(l_idx);
+                                    *l = $OP(*l, r);
+                                }
+                            }
+                        }
+                    });
 
-        Ok(out)
-    }
+                    let leaf_validity = combine_validities_list_to_primitive_no_broadcast(
+                        offsets_lhs,
+                        arr_lhs.validity(),
+                        arr_rhs.validity(),
+                        arr_lhs.len(),
+                    );
 
-    /// Construct the result `ListChunked` from the leaf array and the offsets/validities of every
-    /// level.
-    fn finish_offsets_and_validities(
-        &mut self,
-        leaf_array: Box<dyn Array>,
-        offsets: Vec<OffsetsBuffer<i64>>,
-        validities: Vec<Option<Bitmap>>,
-    ) -> PolarsResult<ListChunked> {
-        assert!(!offsets.is_empty());
-        assert_eq!(offsets.len(), validities.len());
-        let mut results = leaf_array;
-
-        let mut iter = offsets.into_iter().zip(validities).rev();
-
-        while iter.len() > 1 {
-            let (offsets, validity) = iter.next().unwrap();
-            let dtype = LargeListArray::default_datatype(results.dtype().clone());
-            results = Box::new(LargeListArray::new(dtype, offsets, results, validity));
+                    let arr = arr_lhs.with_validity(leaf_validity);
+
+                    let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+                    self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
+                },
+                (BinaryOpApplyType::ListToPrimitive, Broadcast::Right) => {
+                    assert_eq!(arr_rhs.len(), 1);
+
+                    let Some(r) = (unsafe { arr_rhs.get_unchecked(0) }) else {
+                        // RHS is single primitive NULL, create the result by setting the leaf validity to all-NULL.
+                        let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+                        return self.finish_offsets_and_validities(
+                            Box::new(
+                                arr_lhs.clone().with_validity(Some(Bitmap::new_with_value(
+                                    false,
+                                    arr_lhs.len(),
+                                ))),
+                            ),
+                            offsets,
+                            validities,
+                        );
+                    };
+
+                    let arr = self.op.apply_array_to_scalar::<T>(arr_lhs, r, self.swapped);
+                    let (offsets, validities, _) = core::mem::take(&mut self.data_lhs);
+
+                    self.finish_offsets_and_validities(Box::new(arr), offsets, validities)
+                },
+                v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::Right)
+                | v @ (BinaryOpApplyType::ListToList, Broadcast::Left)
+                | v @ (BinaryOpApplyType::ListToPrimitive, Broadcast::Left)
+                | v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::Left)
+                | v @ (BinaryOpApplyType::PrimitiveToList, Broadcast::NoBroadcast) => {
+                    if cfg!(debug_assertions) {
+                        panic!("operation was not re-written: {:?}", v)
+                    } else {
+                        unreachable!()
+                    }
+                },
+            }?;
+
+            Ok(out)
         }
 
-        // The combined outer validity is pre-computed during `try_new()`
-        let (offsets, _) = iter.next().unwrap();
-        let validity = core::mem::take(&mut self.outer_validity);
-        let dtype = LargeListArray::default_datatype(results.dtype().clone());
-        let results = LargeListArray::new(dtype, offsets, results, Some(validity));
+        /// Construct the result `ListChunked` from the leaf array and the offsets/validities of every
+        /// level.
+        fn finish_offsets_and_validities(
+            &mut self,
+            leaf_array: Box<dyn Array>,
+            offsets: Vec<OffsetsBuffer<i64>>,
+            validities: Vec<Option<Bitmap>>,
+        ) -> PolarsResult<ListChunked> {
+            assert!(!offsets.is_empty());
+            assert_eq!(offsets.len(), validities.len());
+            let mut results = leaf_array;
+
+            let mut iter = offsets.into_iter().zip(validities).rev();
+
+            while iter.len() > 1 {
+                let (offsets, validity) = iter.next().unwrap();
+                let dtype = LargeListArray::default_datatype(results.dtype().clone());
+                results = Box::new(LargeListArray::new(dtype, offsets, results, validity));
+            }
 
-        Ok(ListChunked::with_chunk(
-            core::mem::take(&mut self.output_name),
-            results,
-        ))
-    }
+            // The combined outer validity is pre-computed during `try_new()`
+            let (offsets, _) = iter.next().unwrap();
+            let validity = core::mem::take(&mut self.outer_validity);
+            let dtype = LargeListArray::default_datatype(results.dtype().clone());
+            let results = LargeListArray::new(dtype, offsets, results, Some(validity));
 
-    fn materialize_broadcasted_list(
-        side_data: &mut (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
-        output_len: usize,
-        output_primitive_dtype: &DataType,
-    ) -> (Box<dyn Array>, usize) {
-        let s = &side_data.2;
-        assert_eq!(s.len(), 1);
-
-        let expected_n_values = {
-            let offsets = s.list_offsets_and_validities_recursive().0;
-            output_len * OffsetsBuffer::<i64>::leaf_full_start_end(&offsets).len()
-        };
-
-        let ca = s.list().unwrap();
-        // Remember to cast the leaf primitives to the supertype.
-        let ca = ca
-            .cast(&ca.dtype().cast_leaf(output_primitive_dtype.clone()))
-            .unwrap();
-        assert!(output_len > 1); // In case there is a fast-path that doesn't give us owned data.
-        let ca = ca.new_from_index(0, output_len).rechunk();
-
-        let s = ca.into_series();
-
-        *side_data = {
-            let (a, b) = s.list_offsets_and_validities_recursive();
-            // `Series::default()`: This field in the tuple is no longer used.
-            (a, b, Series::default())
-        };
-
-        let n_values = OffsetsBuffer::<i64>::leaf_full_start_end(&side_data.0).len();
-        assert_eq!(n_values, expected_n_values);
-
-        let mut s = s.get_leaf_array();
-        let v = unsafe { s.chunks_mut() };
-
-        assert_eq!(v.len(), 1);
-        (v.swap_remove(0), n_values)
-    }
-}
+            Ok(ListChunked::with_chunk(
+                core::mem::take(&mut self.output_name),
+                results,
+            ))
+        }
 
-/// Used in 2 places, so it's outside here.
-#[inline(never)]
-fn combine_validities_list_to_primitive_no_broadcast(
-    offsets_lhs: &[OffsetsBuffer<i64>],
-    validity_lhs: Option<&Bitmap>,
-    validity_rhs: Option<&Bitmap>,
-    len_lhs: usize,
-) -> Option<Bitmap> {
-    match (validity_lhs, validity_rhs) {
-        (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
-        (Some(v), None) => return Some(v.clone()),
-        // Materialize a full-true validity to re-use the codepath, as we still
-        // need to spread the bits from the RHS to the correct positions.
-        (None, Some(v)) => Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v)),
-        (None, None) => None,
+        fn materialize_broadcasted_list(
+            side_data: &mut (Vec<OffsetsBuffer<i64>>, Vec<Option<Bitmap>>, Series),
+            output_len: usize,
+            output_primitive_dtype: &DataType,
+        ) -> (Box<dyn Array>, usize) {
+            let s = &side_data.2;
+            assert_eq!(s.len(), 1);
+
+            let expected_n_values = {
+                let offsets = s.list_offsets_and_validities_recursive().0;
+                output_len * OffsetsBuffer::<i64>::leaf_full_start_end(&offsets).len()
+            };
+
+            let ca = s.list().unwrap();
+            // Remember to cast the leaf primitives to the supertype.
+            let ca = ca
+                .cast(&ca.dtype().cast_leaf(output_primitive_dtype.clone()))
+                .unwrap();
+            assert!(output_len > 1); // In case there is a fast-path that doesn't give us owned data.
+            let ca = ca.new_from_index(0, output_len).rechunk();
+
+            let s = ca.into_series();
+
+            *side_data = {
+                let (a, b) = s.list_offsets_and_validities_recursive();
+                // `Series::default()`: This field in the tuple is no longer used.
+                (a, b, Series::default())
+            };
+
+            let n_values = OffsetsBuffer::<i64>::leaf_full_start_end(&side_data.0).len();
+            assert_eq!(n_values, expected_n_values);
+
+            let mut s = s.get_leaf_array();
+            let v = unsafe { s.chunks_mut() };
+
+            assert_eq!(v.len(), 1);
+            (v.swap_remove(0), n_values)
+        }
     }
-    .map(|(mut validity_out, validity_rhs)| {
-        for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate() {
-            let r_valid = unsafe { validity_rhs.get_bit_unchecked(i) };
-            for l_idx in l_range {
-                let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
-                let is_valid = l_valid & r_valid;
-
-                // Size and alignment of validity vec are based on LHS.
-                unsafe { validity_out.set_unchecked(l_idx, is_valid) };
-            }
+
+    /// Used in 2 places, so it's outside here.
+    #[inline(never)]
+    fn combine_validities_list_to_primitive_no_broadcast(
+        offsets_lhs: &[OffsetsBuffer<i64>],
+        validity_lhs: Option<&Bitmap>,
+        validity_rhs: Option<&Bitmap>,
+        len_lhs: usize,
+    ) -> Option<Bitmap> {
+        match (validity_lhs, validity_rhs) {
+            (Some(l), Some(r)) => Some((l.clone().make_mut(), r)),
+            (Some(v), None) => return Some(v.clone()),
+            // Materialize a full-true validity to re-use the codepath, as we still
+            // need to spread the bits from the RHS to the correct positions.
+            (None, Some(v)) => Some((Bitmap::new_with_value(true, len_lhs).make_mut(), v)),
+            (None, None) => None,
         }
+        .map(|(mut validity_out, validity_rhs)| {
+            for (i, l_range) in OffsetsBuffer::<i64>::leaf_ranges_iter(offsets_lhs).enumerate() {
+                let r_valid = unsafe { validity_rhs.get_bit_unchecked(i) };
+                for l_idx in l_range {
+                    let l_valid = unsafe { validity_out.get_unchecked(l_idx) };
+                    let is_valid = l_valid & r_valid;
+
+                    // Size and alignment of validity vec are based on LHS.
+                    unsafe { validity_out.set_unchecked(l_idx, is_valid) };
+                }
+            }
 
-        validity_out.freeze()
-    })
+            validity_out.freeze()
+        })
+    }
 }
diff --git a/crates/polars-python/Cargo.toml b/crates/polars-python/Cargo.toml
index 616ba491a19a..16423dc4c15a 100644
--- a/crates/polars-python/Cargo.toml
+++ b/crates/polars-python/Cargo.toml
@@ -75,6 +75,7 @@ features = [
   "lazy",
   "list_eval",
   "list_to_struct",
+  "list_arithmetic",
   "array_to_struct",
   "log",
   "mode",
diff --git a/crates/polars/Cargo.toml b/crates/polars/Cargo.toml
index a710011aa045..5baefb2e1ec2 100644
--- a/crates/polars/Cargo.toml
+++ b/crates/polars/Cargo.toml
@@ -184,6 +184,7 @@ list_gather = ["polars-ops/list_gather", "polars-lazy?/list_gather"]
 list_sample = ["polars-lazy?/list_sample"]
 list_sets = ["polars-lazy?/list_sets"]
 list_to_struct = ["polars-ops/list_to_struct", "polars-lazy?/list_to_struct"]
+list_arithmetic = ["polars-core/list_arithmetic"]
 array_to_struct = ["polars-ops/array_to_struct", "polars-lazy?/array_to_struct"]
 log = ["polars-ops/log", "polars-lazy?/log"]
 merge_sorted = ["polars-lazy?/merge_sorted"]