pola-rs · tylerriccio33 · Nov 3, 2024 · Nov 4, 2024 · Nov 4, 2024 · Nov 4, 2024
@@ -8,10 +8,11 @@
 
 if TYPE_CHECKING:
     import sys
-    from collections.abc import Iterable
+    from collections.abc import Iterable, Iterator
     from datetime import timedelta
+    from typing import Any
 
-    from polars import DataFrame
+    from polars import DataFrame, Series
     from polars._typing import (
         ClosedInterval,
         IntoExpr,
@@ -22,9 +23,41 @@
     )
 
     if sys.version_info >= (3, 11):
-        from typing import Self
+        pass
     else:
-        from typing_extensions import Self
+        pass
+
+
+class _GroupByIterator:
+    """
+    Single-pass iterator over the groups of a group by operation.
+
+    Each call to `next` returns one `(group_name, group_data)` pair, where
+    `group_data` is obtained by indexing the rows of `df` with the entry of
+    `group_indices` at the current position.
+
+    Parameters
+    ----------
+    df
+        The frame whose rows are selected for every group.
+    group_names
+        Iterator producing one name tuple per group; it is advanced once per
+        returned pair.
+    group_indices
+        Sequence whose entries are used as row selectors into `df`, one entry
+        per group.
+    """
+
+    def __init__(
+        self,
+        df: DataFrame,
+        group_names: Iterator[tuple[Any, ...]],
+        group_indices: Series,
+    ) -> None:
+        self._group_names = group_names
+        self._group_indices = group_indices
+        # Position of the next entry of `_group_indices` to hand out.
+        self._current_index = 0
+        self.df = df
+
+    def __next__(self) -> tuple[tuple[object, ...], DataFrame]:
+        """
+        Return the next `(group_name, group_data)` pair.
+
+        Raises
+        ------
+        StopIteration
+            When every entry of `group_indices` has been consumed, or when
+            `group_names` runs out first.
+        """
+        # Both attributes are always assigned in `__init__`, so the bounds
+        # check is performed directly.
+        if self._current_index >= len(self._group_indices):
+            raise StopIteration
+
+        group_name = next(self._group_names)
+        group_data = self.df[self._group_indices[self._current_index], :]
+        self._current_index += 1
+
+        return group_name, group_data
+
+    def __iter__(self) -> _GroupByIterator:
+        """Return the iterator itself, as the iterator protocol requires."""
+        return self
 
 
 class GroupBy:
@@ -61,7 +94,7 @@ def __init__(
         self.named_by = named_by
         self.maintain_order = maintain_order
 
-    def __iter__(self) -> Self:
+    def __iter__(self) -> _GroupByIterator:
         """
         Allows iteration over the groups of the group by operation.
 
@@ -108,17 +141,7 @@ def __iter__(self) -> Self:
         self._group_indices = groups_df.select(temp_col).to_series()
         self._current_index = 0
 
-        return self
-
-    def __next__(self) -> tuple[tuple[object, ...], DataFrame]:
-        if self._current_index >= len(self._group_indices):
-            raise StopIteration
-
-        group_name = next(self._group_names)
-        group_data = self.df[self._group_indices[self._current_index], :]
-        self._current_index += 1
-
-        return group_name, group_data
+        return _GroupByIterator(self.df, self._group_names, self._group_indices)
 
     def agg(
         self,
@@ -784,7 +807,7 @@ def __init__(
         self.closed = closed
         self.group_by = group_by
 
-    def __iter__(self) -> Self:
+    def __iter__(self) -> _GroupByIterator:
         temp_col = "__POLARS_GB_GROUP_INDICES"
         groups_df = (
             self.df.lazy()
@@ -803,17 +826,7 @@ def __iter__(self) -> Self:
         self._group_indices = groups_df.select(temp_col).to_series()
         self._current_index = 0
 
-        return self
-
-    def __next__(self) -> tuple[tuple[object, ...], DataFrame]:
-        if self._current_index >= len(self._group_indices):
-            raise StopIteration
-
-        group_name = next(self._group_names)
-        group_data = self.df[self._group_indices[self._current_index], :]
-        self._current_index += 1
-
-        return group_name, group_data
+        return _GroupByIterator(self.df, self._group_names, self._group_indices)
 
     def agg(
         self,
@@ -926,7 +939,7 @@ def __init__(
         self.group_by = group_by
         self.start_by = start_by
 
-    def __iter__(self) -> Self:
+    def __iter__(self) -> _GroupByIterator:
         temp_col = "__POLARS_GB_GROUP_INDICES"
         groups_df = (
             self.df.lazy()
@@ -949,17 +962,7 @@ def __iter__(self) -> Self:
         self._group_indices = groups_df.select(temp_col).to_series()
         self._current_index = 0
 
-        return self
-
-    def __next__(self) -> tuple[tuple[object, ...], DataFrame]:
-        if self._current_index >= len(self._group_indices):
-            raise StopIteration
-
-        group_name = next(self._group_names)
-        group_data = self.df[self._group_indices[self._current_index], :]
-        self._current_index += 1
-
-        return group_name, group_data
+        return _GroupByIterator(self.df, self._group_names, self._group_indices)
 
     def agg(
         self,

@@ -14,6 +14,20 @@
 
 if TYPE_CHECKING:
     from polars._typing import PolarsDataType
+    from polars.dataframe.group_by import _GroupByIterator
+
+
+@pytest.mark.parametrize(
+    "context",
+    [
+        pl.DataFrame().group_by(1),
+        pl.DataFrame().group_by_dynamic(1, every="days"),
+        pl.DataFrame({"int": []}).rolling("int", period="31"),
+    ],
+)
+def test_group_by_no_iter(context: _GroupByIterator) -> None:
+    """
+    Calling `next` directly on a group by context must raise `TypeError`.
+
+    The objects returned by `group_by`, `group_by_dynamic` and `rolling` are
+    passed straight to `next` without calling `iter` on them first, and the
+    call is expected to fail with "object is not an iterator".
+    """
+    # NOTE(review): `context` is annotated as `_GroupByIterator`, but the
+    # parametrized values are the results of `group_by` / `group_by_dynamic` /
+    # `rolling`, which this test asserts are NOT iterators. Presumably the
+    # annotation only exists so that `next(context)` type-checks - confirm.
+    with pytest.raises(TypeError, match="object is not an iterator"):
+        next(context)
 
 
 def test_group_by() -> None: