narwhals-dev · MarcoGorelli · Aug 18, 2025 · Aug 17, 2025 · Aug 17, 2025 · Aug 17, 2025
diff --git a/narwhals/_arrow/dataframe.py b/narwhals/_arrow/dataframe.py
@@ -21,6 +21,7 @@
     parse_columns_to_drop,
     scale_bytes,
     supports_arrow_c_stream,
+    zip_strict,
 )
 from narwhals.dependencies import is_numpy_array_1d
 from narwhals.exceptions import ShapeError
@@ -202,7 +203,7 @@ def rows(self, *, named: bool) -> list[tuple[Any, ...]] | list[dict[str, Any]]:
         return self.native.to_pylist()
 
     def iter_columns(self) -> Iterator[ArrowSeries]:
-        for name, series in zip(self.columns, self.native.itercolumns()):
+        for name, series in zip_strict(self.columns, self.native.itercolumns()):
             yield ArrowSeries.from_native(series, context=self, name=name)
 
     _iter_columns = iter_columns
@@ -216,7 +217,7 @@ def iter_rows(
         if not named:
             for i in range(0, num_rows, buffer_size):
                 rows = df[i : i + buffer_size].to_pydict().values()
-                yield from zip(*rows)
+                yield from zip_strict(*rows)
         else:
             for i in range(0, num_rows, buffer_size):
                 yield from df[i : i + buffer_size].to_pylist()
@@ -287,10 +288,9 @@ def _select_multi_name(
 
     @property
     def schema(self) -> dict[str, DType]:
-        schema = self.native.schema
         return {
-            name: native_to_narwhals_dtype(dtype, self._version)
-            for name, dtype in zip(schema.names, schema.types)
+            field.name: native_to_narwhals_dtype(field.type, self._version)
+            for field in self.native.schema
         }
 
     def collect_schema(self) -> dict[str, DType]:
@@ -431,7 +431,7 @@ def sort(self, *by: str, descending: bool | Sequence[bool], nulls_last: bool) ->
         else:
             sorting = [
                 (key, "descending" if is_descending else "ascending")
-                for key, is_descending in zip(by, descending)
+                for key, is_descending in zip_strict(by, descending)
             ]
 
         null_placement = "at_end" if nulls_last else "at_start"

diff --git a/narwhals/_compliant/expr.py b/narwhals/_compliant/expr.py
@@ -28,7 +28,7 @@
     LazyExprT,
     NativeExprT,
 )
-from narwhals._utils import _StoresCompliant, qualified_type_name
+from narwhals._utils import _StoresCompliant, qualified_type_name, zip_strict
 from narwhals.dependencies import is_numpy_array, is_numpy_scalar
 
 if TYPE_CHECKING:
@@ -282,13 +282,13 @@ def func(df: EagerDataFrameT) -> list[EagerSeriesT]:
             if alias_output_names:
                 return [
                     series.alias(name)
-                    for series, name in zip(
+                    for series, name in zip_strict(
                         self(df), alias_output_names(self._evaluate_output_names(df))
                     )
                 ]
             return [
                 series.alias(name)
-                for series, name in zip(self(df), self._evaluate_output_names(df))
+                for series, name in zip_strict(self(df), self._evaluate_output_names(df))
             ]
 
         return self.__class__(
@@ -772,7 +772,7 @@ def func(df: EagerDataFrameT) -> Sequence[EagerSeriesT]:
                 )
                 result = tuple(
                     from_numpy(array).alias(output_name)
-                    for array, output_name in zip(udf_series_out, output_names)
+                    for array, output_name in zip_strict(udf_series_out, output_names)
                 )
             else:
                 result = udf_series_out

diff --git a/narwhals/_compliant/group_by.py b/narwhals/_compliant/group_by.py
@@ -16,7 +16,7 @@
     EagerExprT_contra,
     NarwhalsAggregation,
 )
-from narwhals._utils import is_sequence_of
+from narwhals._utils import is_sequence_of, zip_strict
 
 if TYPE_CHECKING:
     from collections.abc import Iterable, Iterator, Mapping, Sequence
@@ -115,7 +115,7 @@ def _temporary_name(key: str) -> str:
             if (metadata := key._metadata) and metadata.expansion_kind.is_multi_output()
             # otherwise it's single named and we can use Expr.alias
             else key.alias(_temporary_name(new_names[0]))
-            for key, new_names in zip(keys, keys_aliases)
+            for key, new_names in zip_strict(keys, keys_aliases)
         ]
         return (
             compliant_frame.with_columns(*safe_keys),

diff --git a/narwhals/_compliant/selectors.py b/narwhals/_compliant/selectors.py
@@ -12,6 +12,7 @@
     dtype_matches_time_unit_and_time_zone,
     get_column_names,
     is_compliant_dataframe,
+    zip_strict,
 )
 
 if TYPE_CHECKING:
@@ -77,7 +78,7 @@ def _iter_columns_dtypes(
     ) -> Iterator[tuple[SeriesOrExprT, DType]]: ...
 
     def _iter_columns_names(self, df: FrameT, /) -> Iterator[tuple[SeriesOrExprT, str]]:
-        yield from zip(self._iter_columns(df), df.columns)
+        yield from zip_strict(self._iter_columns(df), df.columns)
 
     def _is_dtype(
         self: CompliantSelectorNamespace[FrameT, SeriesOrExprT], dtype: type[DType], /
@@ -192,7 +193,7 @@ def _iter_columns(self, df: LazyFrameT) -> Iterator[ExprT]:
         yield from df._iter_columns()
 
     def _iter_columns_dtypes(self, df: LazyFrameT, /) -> Iterator[tuple[ExprT, DType]]:
-        yield from zip(self._iter_columns(df), df.schema.values())
+        yield from zip_strict(self._iter_columns(df), df.schema.values())
 
 
 class CompliantSelector(
@@ -244,7 +245,9 @@ def __sub__(
             def series(df: FrameT) -> Sequence[SeriesOrExprT]:
                 lhs_names, rhs_names = _eval_lhs_rhs(df, self, other)
                 return [
-                    x for x, name in zip(self(df), lhs_names) if name not in rhs_names
+                    x
+                    for x, name in zip_strict(self(df), lhs_names)
+                    if name not in rhs_names
                 ]
 
             def names(df: FrameT) -> Sequence[str]:
@@ -268,7 +271,11 @@ def __or__(
             def series(df: FrameT) -> Sequence[SeriesOrExprT]:
                 lhs_names, rhs_names = _eval_lhs_rhs(df, self, other)
                 return [
-                    *(x for x, name in zip(self(df), lhs_names) if name not in rhs_names),
+                    *(
+                        x
+                        for x, name in zip_strict(self(df), lhs_names)
+                        if name not in rhs_names
+                    ),
                     *other(df),
                 ]
 
@@ -292,7 +299,9 @@ def __and__(
 
             def series(df: FrameT) -> Sequence[SeriesOrExprT]:
                 lhs_names, rhs_names = _eval_lhs_rhs(df, self, other)
-                return [x for x, name in zip(self(df), lhs_names) if name in rhs_names]
+                return [
+                    x for x, name in zip_strict(self(df), lhs_names) if name in rhs_names
+                ]
 
             def names(df: FrameT) -> Sequence[str]:
                 lhs_names, rhs_names = _eval_lhs_rhs(df, self, other)

diff --git a/narwhals/_dask/dataframe.py b/narwhals/_dask/dataframe.py
@@ -17,6 +17,7 @@
     generate_temporary_column_name,
     not_implemented,
     parse_columns_to_drop,
+    zip_strict,
 )
 from narwhals.typing import CompliantLazyFrame
 
@@ -284,7 +285,7 @@ def _join_left(
         )
         extra = [
             right_key if right_key not in self.columns else f"{right_key}{suffix}"
-            for left_key, right_key in zip(left_on, right_on)
+            for left_key, right_key in zip_strict(left_on, right_on)
             if right_key != left_key
         ]
         return result_native.drop(columns=extra)

diff --git a/narwhals/_dask/group_by.py b/narwhals/_dask/group_by.py
@@ -7,6 +7,7 @@
 
 from narwhals._compliant import DepthTrackingGroupBy
 from narwhals._expression_parsing import evaluate_output_names_and_aliases
+from narwhals._utils import zip_strict
 
 if TYPE_CHECKING:
     from collections.abc import Mapping, Sequence
@@ -138,7 +139,7 @@ def agg(self, *exprs: DaskExpr) -> DaskLazyFrame:
             agg_fn = agg_fn(**expr._scalar_kwargs) if callable(agg_fn) else agg_fn
             simple_aggregations.update(
                 (alias, (output_name, agg_fn))
-                for alias, output_name in zip(aliases, output_names)
+                for alias, output_name in zip_strict(aliases, output_names)
             )
         return DaskLazyFrame(
             self._grouped.agg(**simple_aggregations).reset_index(),

diff --git a/narwhals/_dask/namespace.py b/narwhals/_dask/namespace.py
@@ -26,7 +26,7 @@
     combine_alias_output_names,
     combine_evaluate_output_names,
 )
-from narwhals._utils import Implementation
+from narwhals._utils import Implementation, zip_strict
 
 if TYPE_CHECKING:
     from collections.abc import Iterable, Sequence
@@ -263,15 +263,17 @@ def func(df: DaskLazyFrame) -> list[dx.Series]:
                 )
             else:
                 init_value, *values = [
-                    s.where(~nm, "") for s, nm in zip(series, null_mask)
+                    s.where(~nm, "") for s, nm in zip_strict(series, null_mask)
                 ]
 
                 separators = (
                     nm.map({True: "", False: separator}, meta=str)
                     for nm in null_mask[:-1]
                 )
                 result = reduce(
-                    operator.add, (s + v for s, v in zip(separators, values)), init_value
+                    operator.add,
+                    (s + v for s, v in zip_strict(separators, values)),
+                    init_value,
                 )
 
             return [result]

diff --git a/narwhals/_duckdb/dataframe.py b/narwhals/_duckdb/dataframe.py
@@ -26,6 +26,7 @@
     not_implemented,
     parse_columns_to_drop,
     requires,
+    zip_strict,
 )
 from narwhals.dependencies import get_duckdb
 from narwhals.exceptions import InvalidOperationError
@@ -231,7 +232,9 @@ def schema(self) -> dict[str, DType]:
             column_name: native_to_narwhals_dtype(
                 duckdb_dtype, self._version, deferred_time_zone
             )
-            for column_name, duckdb_dtype in zip(self.native.columns, self.native.types)
+            for column_name, duckdb_dtype in zip_strict(
+                self.native.columns, self.native.types
+            )
         }
 
     @property
@@ -295,7 +298,7 @@ def join(
             assert right_on is not None  # noqa: S101
             it = (
                 col(f'lhs."{left}"') == col(f'rhs."{right}"')
-                for left, right in zip(left_on, right_on)
+                for left, right in zip_strict(left_on, right_on)
             )
             condition: Expression = reduce(and_, it)
             rel = self.native.set_alias("lhs").join(
@@ -340,7 +343,7 @@ def join_asof(
         if by_left is not None and by_right is not None:
             conditions.extend(
                 col(f'lhs."{left}"') == col(f'rhs."{right}"')
-                for left, right in zip(by_left, by_right)
+                for left, right in zip_strict(by_left, by_right)
             )
         else:
             by_left = by_right = []
@@ -400,12 +403,12 @@ def sort(self, *by: str, descending: bool | Sequence[bool], nulls_last: bool) ->
         if nulls_last:
             it = (
                 col(name).nulls_last() if not desc else col(name).desc().nulls_last()
-                for name, desc in zip(by, descending)
+                for name, desc in zip_strict(by, descending)
             )
         else:
             it = (
                 col(name).nulls_first() if not desc else col(name).desc().nulls_first()
-                for name, desc in zip(by, descending)
+                for name, desc in zip_strict(by, descending)
             )
         return self._with_native(self.native.sort(*it))
 

diff --git a/narwhals/_duckdb/utils.py b/narwhals/_duckdb/utils.py
@@ -7,7 +7,7 @@
 import duckdb.typing as duckdb_dtypes
 from duckdb.typing import DuckDBPyType
 
-from narwhals._utils import Version, isinstance_or_issubclass
+from narwhals._utils import Version, isinstance_or_issubclass, zip_strict
 from narwhals.exceptions import ColumnNotFoundError
 
 if TYPE_CHECKING:
@@ -302,7 +302,7 @@ def generate_order_by_sql(
         return ""
     by_sql = ",".join(
         f"{parse_into_expression(x)} {DESCENDING_TO_ORDER[_descending]} {NULLS_LAST_TO_NULLS_POS[_nulls_last]}"
-        for x, _descending, _nulls_last in zip(order_by, descending, nulls_last)
+        for x, _descending, _nulls_last in zip_strict(order_by, descending, nulls_last)
     )
     return f"order by {by_sql}"
 

diff --git a/narwhals/_expression_parsing.py b/narwhals/_expression_parsing.py
@@ -8,7 +8,7 @@
 from itertools import chain
 from typing import TYPE_CHECKING, Any, Literal, TypeVar, cast
 
-from narwhals._utils import is_compliant_expr
+from narwhals._utils import is_compliant_expr, zip_strict
 from narwhals.dependencies import is_narwhals_series, is_numpy_array
 from narwhals.exceptions import InvalidOperationError, MultiOutputExpressionError
 
@@ -104,10 +104,10 @@ def evaluate_output_names_and_aliases(
     if exclude:
         assert expr._metadata is not None  # noqa: S101
         if expr._metadata.expansion_kind.is_multi_unnamed():
-            output_names, aliases = zip(
+            output_names, aliases = zip_strict(
                 *[
                     (x, alias)
-                    for x, alias in zip(output_names, aliases)
+                    for x, alias in zip_strict(output_names, aliases)
                     if x not in exclude
                 ]
             )
@@ -626,6 +626,6 @@ def apply_n_ary_operation(
         compliant_expr.broadcast(kind)
         if broadcast and is_compliant_expr(compliant_expr) and is_scalar_like(kind)
         else compliant_expr
-        for compliant_expr, kind in zip(compliant_exprs, kinds)
+        for compliant_expr, kind in zip_strict(compliant_exprs, kinds)
     )
     return function(*compliant_exprs)
diff --git a/narwhals/_ibis/dataframe.py b/narwhals/_ibis/dataframe.py
@@ -15,6 +15,7 @@
     Version,
     not_implemented,
     parse_columns_to_drop,
+    zip_strict,
 )
 from narwhals.exceptions import ColumnNotFoundError, InvalidOperationError
 
@@ -307,7 +308,7 @@ def _convert_predicates(
             return left_on
         return [
             cast("ir.BooleanColumn", (self.native[left] == other.native[right]))
-            for left, right in zip(left_on, right_on)
+            for left, right in zip_strict(left_on, right_on)
         ]
 
     def collect_schema(self) -> dict[str, DType]:

diff --git a/narwhals/_ibis/expr.py b/narwhals/_ibis/expr.py
@@ -12,7 +12,7 @@
 from narwhals._ibis.expr_struct import IbisExprStructNamespace
 from narwhals._ibis.utils import is_floating, lit, narwhals_to_native_dtype
 from narwhals._sql.expr import SQLExpr
-from narwhals._utils import Implementation, Version, not_implemented
+from narwhals._utils import Implementation, Version, not_implemented, zip_strict
 
 if TYPE_CHECKING:
     from collections.abc import Iterator, Sequence
@@ -128,7 +128,7 @@ def _sort(
         }
         yield from (
             cast("ir.Column", mapping[(_desc, _nulls_last)](col))
-            for col, _desc, _nulls_last in zip(cols, descending, nulls_last)
+            for col, _desc, _nulls_last in zip_strict(cols, descending, nulls_last)
         )
 
     @classmethod

diff --git a/narwhals/_pandas_like/dataframe.py b/narwhals/_pandas_like/dataframe.py
@@ -29,6 +29,7 @@
     generate_temporary_column_name,
     parse_columns_to_drop,
     scale_bytes,
+    zip_strict,
 )
 from narwhals.dependencies import is_pandas_like_dataframe
 from narwhals.exceptions import InvalidOperationError, ShapeError
@@ -561,7 +562,7 @@ def _join_left(
         )
         extra = [
             right_key if right_key not in self.columns else f"{right_key}{suffix}"
-            for left_key, right_key in zip(left_on, right_on)
+            for left_key, right_key in zip_strict(left_on, right_on)
             if right_key != left_key
         ]
         # NOTE: Keep `inplace=True` to avoid making a redundant copy.

diff --git a/narwhals/_pandas_like/group_by.py b/narwhals/_pandas_like/group_by.py
@@ -9,6 +9,7 @@
 from narwhals._compliant import EagerGroupBy
 from narwhals._exceptions import issue_warning
 from narwhals._expression_parsing import evaluate_output_names_and_aliases
+from narwhals._utils import zip_strict
 from narwhals.dependencies import is_pandas_like_dataframe
 
 if TYPE_CHECKING:
@@ -283,7 +284,7 @@ def fn(df: pd.DataFrame) -> pd.Series[Any]:
                 for expr in exprs
                 for keys in expr(compliant)
             )
-            out_group, out_names = zip(*results) if results else ([], [])
+            out_group, out_names = zip_strict(*results) if results else ([], [])
             return into_series(out_group, index=out_names, context=ns).native
 
         return fn