Skip to content

Commit a98c68c

Browse files
committed
groupby -> group_by update
1 parent 7998163 commit a98c68c

File tree

7 files changed: 29 additions and 21 deletions.

check_completeness.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -36,16 +36,16 @@
3636
if i not in polars_spec:
3737
print(f"Series.{i} missing from polars spec!")
3838

39-
# groupby
39+
# group_by
4040
spec = dataframe_api.GroupBy().__dir__()
4141
pandas_spec = (
4242
pandas_standard.PandasDataFrame(pd.DataFrame({"a": [1]}), api_version="2023.08-beta")
43-
.groupby(["a"])
43+
.group_by(["a"])
4444
.__dir__()
4545
)
4646
polars_spec = (
4747
polars_standard.PolarsDataFrame(pl.DataFrame({"a": [1]}), api_version="2023.08-beta")
48-
.groupby(["a"])
48+
.group_by(["a"])
4949
.__dir__()
5050
)
5151

@@ -61,7 +61,7 @@
6161
"Sequence",
6262
"column_object",
6363
"dataframe_object",
64-
"groupby_object",
64+
"group_by_object",
6565
"DType",
6666
}
6767
spec = [i for i in dataframe_api.__dir__() if i not in exclude and not i.startswith("_")]

dataframe_api_compat/pandas_standard/pandas_standard.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -373,7 +373,7 @@ def _validate_result(self, result: pd.DataFrame) -> None:
373373
# defensive check
374374
raise AssertionError(
375375
"Groupby operation could not be performed on columns "
376-
f"{failed_columns}. Please drop them before calling groupby."
376+
f"{failed_columns}. Please drop them before calling group_by."
377377
)
378378

379379
def size(self) -> PandasDataFrame:
@@ -511,7 +511,7 @@ def dataframe(self) -> pd.DataFrame:
511511
def shape(self) -> tuple[int, int]:
512512
return self.dataframe.shape
513513

514-
def groupby(self, keys: Sequence[str]) -> PandasGroupBy:
514+
def group_by(self, keys: Sequence[str]) -> PandasGroupBy:
515515
if not isinstance(keys, collections.abc.Sequence):
516516
raise TypeError(f"Expected sequence of strings, got: {type(keys)}")
517517
if isinstance(keys, str):
@@ -606,6 +606,9 @@ def rename_columns(self, mapping: Mapping[str, str]) -> PandasDataFrame:
606606
)
607607

608608
def get_column_names(self) -> list[str]:
609+
# DO NOT REMOVE
610+
# This one is used in upstream tests - even if deprecated,
611+
# just leave it in for backwards compatibility
609612
return self.dataframe.columns.tolist()
610613

611614
def sorted_indices(

dataframe_api_compat/polars_standard/polars_standard.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -770,7 +770,9 @@ def __init__(self, df: pl.LazyFrame, keys: Sequence[str], api_version: str) -> N
770770
self.df = df
771771
self.keys = keys
772772
self._api_version = api_version
773-
self.group_by = self.df.groupby if pl.__version__ < "0.19.0" else self.df.group_by
773+
self.group_by = (
774+
self.df.group_by if pl.__version__ < "0.19.0" else self.df.group_by
775+
)
774776

775777
def size(self) -> PolarsDataFrame:
776778
result = self.group_by(self.keys).count().rename({"count": "size"})
@@ -866,7 +868,7 @@ def __dataframe_namespace__(self) -> Any:
866868
def dataframe(self) -> pl.LazyFrame:
867869
return self.df
868870

869-
def groupby(self, keys: Sequence[str]) -> PolarsGroupBy:
871+
def group_by(self, keys: Sequence[str]) -> PolarsGroupBy:
870872
return PolarsGroupBy(self.df, keys, api_version=self._api_version)
871873

872874
def get_column_by_name(self, name: str) -> PolarsColumn[DType]:
@@ -938,6 +940,9 @@ def rename_columns(self, mapping: Mapping[str, str]) -> PolarsDataFrame:
938940
)
939941

940942
def get_column_names(self) -> list[str]:
943+
# DO NOT REMOVE
944+
# This one is used in upstream tests - even if deprecated,
945+
# just leave it in for backwards compatibility
941946
return self.dataframe.columns
942947

943948
def __eq__( # type: ignore[override]

tests/groupby/groupby_any_all_test.py

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -17,15 +17,15 @@
1717
("all", [False, True], [False, False]),
1818
],
1919
)
20-
def test_groupby_boolean(
20+
def test_group_by_boolean(
2121
library: str,
2222
aggregation: str,
2323
expected_b: list[bool],
2424
expected_c: list[bool],
2525
request: pytest.FixtureRequest,
2626
) -> None:
2727
df = bool_dataframe_2(library)
28-
result = getattr(df.groupby(["key"]), aggregation)()
28+
result = getattr(df.group_by(["key"]), aggregation)()
2929
# need to sort
3030
idx = result.sorted_indices(["key"])
3131
result = result.get_rows(idx)
@@ -35,9 +35,9 @@ def test_groupby_boolean(
3535
pd.testing.assert_frame_equal(result_pd, expected)
3636

3737

38-
def test_groupby_invalid_any_all(library: str, request: pytest.FixtureRequest) -> None:
38+
def test_group_by_invalid_any_all(library: str, request: pytest.FixtureRequest) -> None:
3939
df = integer_dataframe_4(library)
4040
with pytest.raises((ValueError, SchemaError)):
41-
df.groupby(["key"]).any()
41+
df.group_by(["key"]).any()
4242
with pytest.raises((ValueError, SchemaError)):
43-
df.groupby(["key"]).all()
43+
df.group_by(["key"]).all()

tests/groupby/invalid_test.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -5,11 +5,11 @@
55
from tests.utils import integer_dataframe_1
66

77

8-
def test_groupby_invalid(library: str) -> None:
8+
def test_group_by_invalid(library: str) -> None:
99
df = integer_dataframe_1(library).select(["a"])
1010
with pytest.raises((KeyError, TypeError)):
11-
df.groupby(0)
11+
df.group_by(0)
1212
with pytest.raises((KeyError, TypeError)):
13-
df.groupby("0")
13+
df.group_by("0")
1414
with pytest.raises((KeyError, TypeError)):
15-
df.groupby(["b"])
15+
df.group_by(["b"])

tests/groupby/numeric_test.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -25,15 +25,15 @@
2525
("var", [0.5, 0.5], [0.5, 0.5]),
2626
],
2727
)
28-
def test_groupby_numeric(
28+
def test_group_by_numeric(
2929
library: str,
3030
aggregation: str,
3131
expected_b: list[float],
3232
expected_c: list[float],
3333
request: pytest.FixtureRequest,
3434
) -> None:
3535
df = integer_dataframe_4(library)
36-
result = getattr(df.groupby(["key"]), aggregation)()
36+
result = getattr(df.group_by(["key"]), aggregation)()
3737
sorted_indices = result.sorted_indices(["key"])
3838
result = result.get_rows(sorted_indices)
3939
result_pd = interchange_to_pandas(result, library)

tests/groupby/size_test.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,9 +12,9 @@
1212
import pytest
1313

1414

15-
def test_groupby_size(library: str, request: pytest.FixtureRequest) -> None:
15+
def test_group_by_size(library: str, request: pytest.FixtureRequest) -> None:
1616
df = integer_dataframe_4(library)
17-
result = df.groupby(["key"]).size()
17+
result = df.group_by(["key"]).size()
1818
# got to sort
1919
idx = result.sorted_indices(["key"])
2020
result = result.get_rows(idx)

0 commit comments

Comments
 (0)