pandas-dev
diff --git a/‎.github/workflows/dependabot.yml
Lines changed: 9 additions & 0 deletions b/‎.github/workflows/dependabot.yml
Lines changed: 9 additions & 0 deletions
diff --git a/‎.pre-commit-config.yaml
Lines changed: 3 additions & 11 deletions b/‎.pre-commit-config.yaml
Lines changed: 3 additions & 11 deletions
diff --git a/‎ci/code_checks.sh
Lines changed: 0 additions & 3 deletions b/‎ci/code_checks.sh
Lines changed: 0 additions & 3 deletions
diff --git a/‎doc/source/_static/reshaping_pivot.png
5.17 KB b/‎doc/source/_static/reshaping_pivot.png
5.17 KB
diff --git a/‎doc/source/getting_started/tutorials.rst
Lines changed: 1 addition & 1 deletion b/‎doc/source/getting_started/tutorials.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/source/user_guide/reshaping.rst
Lines changed: 1 addition & 1 deletion b/‎doc/source/user_guide/reshaping.rst
Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/source/whatsnew/v2.0.0.rst
Lines changed: 1 addition & 0 deletions b/‎doc/source/whatsnew/v2.0.0.rst
Lines changed: 1 addition & 0 deletions
diff --git a/‎doc/source/whatsnew/v2.1.0.rst
Lines changed: 2 additions & 0 deletions b/‎doc/source/whatsnew/v2.1.0.rst
Lines changed: 2 additions & 0 deletions
diff --git a/‎pandas/_config/config.py
Lines changed: 1 addition & 1 deletion b/‎pandas/_config/config.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/_libs/tslibs/timedeltas.pyx
Lines changed: 25 additions & 2 deletions b/‎pandas/_libs/tslibs/timedeltas.pyx
Lines changed: 25 additions & 2 deletions
diff --git a/‎pandas/_testing/_random.py
Lines changed: 3 additions & 1 deletion b/‎pandas/_testing/_random.py
Lines changed: 3 additions & 1 deletion
diff --git a/‎pandas/_testing/contexts.py
Lines changed: 1 addition & 1 deletion b/‎pandas/_testing/contexts.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/compat/numpy/function.py
Lines changed: 1 addition & 1 deletion b/‎pandas/compat/numpy/function.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/accessor.py
Lines changed: 9 additions & 9 deletions b/‎pandas/core/accessor.py
Lines changed: 9 additions & 9 deletions
diff --git a/‎pandas/core/arrays/_mixins.py
Lines changed: 2 additions & 2 deletions b/‎pandas/core/arrays/_mixins.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎pandas/core/arrays/arrow/array.py
Lines changed: 1 addition & 1 deletion b/‎pandas/core/arrays/arrow/array.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/arrays/base.py
Lines changed: 1 addition & 1 deletion b/‎pandas/core/arrays/base.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/arrays/categorical.py
Lines changed: 7 additions & 3 deletions b/‎pandas/core/arrays/categorical.py
Lines changed: 7 additions & 3 deletions
diff --git a/‎pandas/core/arrays/datetimes.py
Lines changed: 1 addition & 1 deletion b/‎pandas/core/arrays/datetimes.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/arrays/interval.py
Lines changed: 1 addition & 1 deletion b/‎pandas/core/arrays/interval.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/arrays/masked.py
Lines changed: 1 addition & 1 deletion b/‎pandas/core/arrays/masked.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎pandas/core/arrays/period.py
Lines changed: 2 additions & 2 deletions b/‎pandas/core/arrays/period.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎pandas/core/arrays/sparse/accessor.py
Lines changed: 2 additions & 2 deletions b/‎pandas/core/arrays/sparse/accessor.py
Lines changed: 2 additions & 2 deletions
@@ -0,0 +1,9 @@
+version: 2
+updates:
+  - package-ecosystem: github-actions
+    directory: /
+    schedule:
+      interval: weekly
+    labels:
+      - "CI"
+      - "Dependencies"
@@ -28,7 +28,7 @@ repos:
         types_or: [python, pyi]
         additional_dependencies: [black==23.1.0]
 -   repo: https://github.com/charliermarsh/ruff-pre-commit
-    rev: v0.0.255
+    rev: v0.0.259
     hooks:
     -   id: ruff
         args: [--exit-non-zero-on-fix]
@@ -392,14 +392,6 @@ repos:
         files: ^pandas/
         exclude: ^(pandas/_libs/|pandas/tests/|pandas/errors/__init__.py$|pandas/_version.py)
         types: [python]
-    -   id: flake8-pyi
-        name: flake8-pyi
-        entry: flake8 --extend-ignore=E301,E302,E305,E701,E704
-        types: [pyi]
-        language: python
-        additional_dependencies:
-        - flake8==5.0.4
-        - flake8-pyi==22.8.1
     -   id: future-annotations
         name: import annotations from __future__
         entry: 'from __future__ import annotations'
@@ -421,8 +413,8 @@ repos:
         language: python
         stages: [manual]
         additional_dependencies:
-        - autotyping==22.9.0
-        - libcst==0.4.7
+        - autotyping==23.3.0
+        - libcst==0.4.9
     -   id: check-test-naming
         name: check that test names start with 'test'
         entry: python -m scripts.check_test_naming
 
@@ -86,8 +86,6 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
     MSG='Partially validate docstrings (EX01)' ;  echo $MSG
     $BASE_DIR/scripts/validate_docstrings.py --format=actions --errors=EX01 --ignore_functions \
         pandas.Series.index \
-        pandas.Series.hasnans \
-        pandas.Series.to_list \
         pandas.Series.__iter__ \
         pandas.Series.keys \
         pandas.Series.item \
@@ -309,7 +307,6 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
         pandas_object \
         pandas.api.interchange.from_dataframe \
         pandas.Index.values \
-        pandas.Index.hasnans \
         pandas.Index.dtype \
         pandas.Index.inferred_type \
         pandas.Index.shape \
 
@@ -113,7 +113,7 @@ Various tutorials
 * `Wes McKinney's (pandas BDFL) blog <https://wesmckinney.com/archives.html>`_
 * `Statistical analysis made easy in Python with SciPy and pandas DataFrames, by Randal Olson <http://www.randalolson.com/2012/08/06/statistical-analysis-made-easy-in-python/>`_
 * `Statistical Data Analysis in Python, tutorial videos, by Christopher Fonnesbeck from SciPy 2013 <https://conference.scipy.org/scipy2013/tutorial_detail.php?id=109>`_
-* `Financial analysis in Python, by Thomas Wiecki <https://nbviewer.ipython.org/github/twiecki/financial-analysis-python-tutorial/blob/master/1.%20Pandas%20Basics.ipynb>`_
+* `Financial analysis in Python, by Thomas Wiecki <https://nbviewer.org/github/twiecki/financial-analysis-python-tutorial/blob/master/1.%20Pandas%20Basics.ipynb>`_
 * `Intro to pandas data structures, by Greg Reda <http://www.gregreda.com/2013/10/26/intro-to-pandas-data-structures/>`_
 * `Pandas and Python: Top 10, by Manish Amde <https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/>`_
 * `Pandas DataFrames Tutorial, by Karlijn Willems <https://www.datacamp.com/community/tutorials/pandas-tutorial-dataframe-python>`_
 
@@ -13,7 +13,7 @@ Reshaping by pivoting DataFrame objects
 
 .. image:: ../_static/reshaping_pivot.png
 
-Data is often stored in so-called "stacked" or "record" format:
+Data is often stored in so-called "stacked" or "record" format. In a "record" or "wide" format, there is typically one row for each subject. In the "stacked" or "long" format, there are multiple rows for each subject where applicable.
 
 .. ipython:: python
 
 
@@ -1190,6 +1190,7 @@ Timedelta
 - Bug in :func:`to_timedelta` raising error when input has nullable dtype ``Float64`` (:issue:`48796`)
 - Bug in :class:`Timedelta` constructor incorrectly raising instead of returning ``NaT`` when given a ``np.timedelta64("nat")`` (:issue:`48898`)
 - Bug in :class:`Timedelta` constructor failing to raise when passed both a :class:`Timedelta` object and keywords (e.g. days, seconds) (:issue:`48898`)
+- Bug in :class:`Timedelta` comparisons with very large ``datetime.timedelta`` objects incorrectly raising ``OutOfBoundsTimedelta`` (:issue:`49021`)
 
 Timezones
 ^^^^^^^^^
 
@@ -36,6 +36,7 @@ Other enhancements
 - :class:`api.extensions.ExtensionArray` now has a :meth:`~api.extensions.ExtensionArray.map` method (:issue:`51809`)
 - Improve error message when having incompatible columns using :meth:`DataFrame.merge` (:issue:`51861`)
 - Improved error message when creating a DataFrame with empty data (0 rows), no index and an incorrect number of columns. (:issue:`52084`)
+- :meth:`DataFrame.applymap` now uses the :meth:`~api.extensions.ExtensionArray.map` method of underlying :class:`api.extensions.ExtensionArray` instances (:issue:`52219`)
 - :meth:`arrays.SparseArray.map` now supports ``na_action`` (:issue:`52096`).
 
 .. ---------------------------------------------------------------------------
@@ -114,6 +115,7 @@ Deprecations
 - Deprecated 'method', 'limit', and 'fill_axis' keywords in :meth:`DataFrame.align` and :meth:`Series.align`, explicitly call ``fillna`` on the alignment results instead (:issue:`51856`)
 - Deprecated 'broadcast_axis' keyword in :meth:`Series.align` and :meth:`DataFrame.align`, upcast before calling ``align`` with ``left = DataFrame({col: left for col in right.columns}, index=right.index)`` (:issue:`51856`)
 - Deprecated the 'axis' keyword in :meth:`.GroupBy.idxmax`, :meth:`.GroupBy.idxmin`, :meth:`.GroupBy.fillna`, :meth:`.GroupBy.take`, :meth:`.GroupBy.skew`, :meth:`.GroupBy.rank`, :meth:`.GroupBy.cumprod`, :meth:`.GroupBy.cumsum`, :meth:`.GroupBy.cummax`, :meth:`.GroupBy.cummin`, :meth:`.GroupBy.pct_change`, :meth:`.GroupBy.diff`, :meth:`.GroupBy.shift`, and :meth:`DataFrameGroupBy.corrwith`; for ``axis=1`` operate on the underlying :class:`DataFrame` instead (:issue:`50405`, :issue:`51046`)
+- Deprecated :meth:`DataFrame.swapaxes` and :meth:`Series.swapaxes`, use :meth:`DataFrame.transpose` or :meth:`Series.transpose` instead (:issue:`51946`)
 -
 
 .. ---------------------------------------------------------------------------
 
@@ -737,7 +737,7 @@ def pp(name: str, ks: Iterable[str]) -> list[str]:
 
 
 @contextmanager
-def config_prefix(prefix) -> Generator[None, None, None]:
+def config_prefix(prefix: str) -> Generator[None, None, None]:
     """
     contextmanager for multiple invocations of API with a common prefix
 
 
@@ -4,6 +4,10 @@ import warnings
 cimport cython
 from cpython.object cimport (
     Py_EQ,
+    Py_GE,
+    Py_GT,
+    Py_LE,
+    Py_LT,
     Py_NE,
     PyObject,
     PyObject_RichCompare,
@@ -1154,8 +1158,27 @@ cdef class _Timedelta(timedelta):
         if isinstance(other, _Timedelta):
             ots = other
         elif is_any_td_scalar(other):
-            ots = Timedelta(other)
-            # TODO: watch out for overflows
+            try:
+                ots = Timedelta(other)
+            except OutOfBoundsTimedelta as err:
+                # GH#49021 pytimedelta.max overflows
+                if not PyDelta_Check(other):
+                    # TODO: handle this case
+                    raise
+                ltup = (self.days, self.seconds, self.microseconds, self.nanoseconds)
+                rtup = (other.days, other.seconds, other.microseconds, 0)
+                if op == Py_EQ:
+                    return ltup == rtup
+                elif op == Py_NE:
+                    return ltup != rtup
+                elif op == Py_LT:
+                    return ltup < rtup
+                elif op == Py_LE:
+                    return ltup <= rtup
+                elif op == Py_GT:
+                    return ltup > rtup
+                elif op == Py_GE:
+                    return ltup >= rtup
 
         elif other is NaT:
             return op == Py_NE
 
@@ -10,7 +10,9 @@
 RANDS_CHARS = np.array(list(string.ascii_letters + string.digits), dtype=(np.str_, 1))
 
 
-def rands_array(nchars, size, dtype: NpDtype = "O", replace: bool = True) -> np.ndarray:
+def rands_array(
+    nchars, size: int, dtype: NpDtype = "O", replace: bool = True
+) -> np.ndarray:
     """
     Generate an array of byte strings.
     """
 
@@ -154,7 +154,7 @@ def ensure_safe_environment_variables() -> Generator[None, None, None]:
 
 
 @contextmanager
-def with_csv_dialect(name, **kwargs) -> Generator[None, None, None]:
+def with_csv_dialect(name: str, **kwargs) -> Generator[None, None, None]:
     """
     Context manager to temporarily register a CSV dialect for parsing CSV.
 
 
@@ -342,7 +342,7 @@ def validate_take_with_convert(convert: ndarray | bool | None, args, kwargs) ->
 )
 
 
-def validate_groupby_func(name, args, kwargs, allowed=None) -> None:
+def validate_groupby_func(name: str, args, kwargs, allowed=None) -> None:
     """
     'args' and 'kwargs' should be empty, except for allowed kwargs because all
     of their necessary parameters are explicitly listed in the function
 
@@ -51,13 +51,13 @@ class PandasDelegate:
     Abstract base class for delegating methods/properties.
     """
 
-    def _delegate_property_get(self, name, *args, **kwargs):
+    def _delegate_property_get(self, name: str, *args, **kwargs):
         raise TypeError(f"You cannot access the property {name}")
 
-    def _delegate_property_set(self, name, value, *args, **kwargs):
+    def _delegate_property_set(self, name: str, value, *args, **kwargs):
         raise TypeError(f"The property {name} cannot be set")
 
-    def _delegate_method(self, name, *args, **kwargs):
+    def _delegate_method(self, name: str, *args, **kwargs):
         raise TypeError(f"You cannot call method {name}")
 
     @classmethod
@@ -91,7 +91,7 @@ def _add_delegate_accessors(
             False skips the missing accessor.
         """
 
-        def _create_delegator_property(name):
+        def _create_delegator_property(name: str):
             def _getter(self):
                 return self._delegate_property_get(name)
 
@@ -107,7 +107,7 @@ def _setter(self, new_values):
                 doc=getattr(delegate, accessor_mapping(name)).__doc__,
             )
 
-        def _create_delegator_method(name):
+        def _create_delegator_method(name: str):
             def f(self, *args, **kwargs):
                 return self._delegate_method(name, *args, **kwargs)
 
@@ -231,7 +231,7 @@ def __get__(self, obj, cls):
 
 
 @doc(klass="", others="")
-def _register_accessor(name, cls):
+def _register_accessor(name: str, cls):
     """
     Register a custom accessor on {klass} objects.
 
@@ -320,21 +320,21 @@ def decorator(accessor):
 
 
 @doc(_register_accessor, klass="DataFrame")
-def register_dataframe_accessor(name):
+def register_dataframe_accessor(name: str):
     from pandas import DataFrame
 
     return _register_accessor(name, DataFrame)
 
 
 @doc(_register_accessor, klass="Series")
-def register_series_accessor(name):
+def register_series_accessor(name: str):
     from pandas import Series
 
     return _register_accessor(name, Series)
 
 
 @doc(_register_accessor, klass="Index")
-def register_index_accessor(name):
+def register_index_accessor(name: str):
     from pandas import Index
 
     return _register_accessor(name, Index)
@@ -291,14 +291,14 @@ def __getitem__(
         return result
 
     def _fill_mask_inplace(
-        self, method: str, limit, mask: npt.NDArray[np.bool_]
+        self, method: str, limit: int | None, mask: npt.NDArray[np.bool_]
     ) -> None:
         # (for now) when self.ndim == 2, we assume axis=0
         func = missing.get_fill_func(method, ndim=self.ndim)
         func(self._ndarray.T, limit=limit, mask=mask.T)
 
     @doc(ExtensionArray.fillna)
-    def fillna(self, value=None, method=None, limit=None) -> Self:
+    def fillna(self, value=None, method=None, limit: int | None = None) -> Self:
         value, method = validate_fillna_kwargs(
             value, method, validate_scalar_dict_value=False
         )
 
@@ -1952,7 +1952,7 @@ def _str_translate(self, table):
             "str.translate not supported with pd.ArrowDtype(pa.string())."
         )
 
-    def _str_wrap(self, width, **kwargs):
+    def _str_wrap(self, width: int, **kwargs):
         raise NotImplementedError(
             "str.wrap not supported with pd.ArrowDtype(pa.string())."
         )
 
@@ -1570,7 +1570,7 @@ def _where(self, mask: npt.NDArray[np.bool_], value) -> Self:
         return result
 
     def _fill_mask_inplace(
-        self, method: str, limit, mask: npt.NDArray[np.bool_]
+        self, method: str, limit: int | None, mask: npt.NDArray[np.bool_]
     ) -> None:
         """
         Replace values in locations specified by 'mask' using pad or backfill.
 
@@ -2500,10 +2500,14 @@ def _validate(data):
         if not is_categorical_dtype(data.dtype):
             raise AttributeError("Can only use .cat accessor with a 'category' dtype")
 
-    def _delegate_property_get(self, name):
+    # error: Signature of "_delegate_property_get" incompatible with supertype
+    # "PandasDelegate"
+    def _delegate_property_get(self, name: str):  # type: ignore[override]
         return getattr(self._parent, name)
 
-    def _delegate_property_set(self, name, new_values):
+    # error: Signature of "_delegate_property_set" incompatible with supertype
+    # "PandasDelegate"
+    def _delegate_property_set(self, name: str, new_values):  # type: ignore[override]
         return setattr(self._parent, name, new_values)
 
     @property
@@ -2515,7 +2519,7 @@ def codes(self) -> Series:
 
         return Series(self._parent.codes, index=self._index)
 
-    def _delegate_method(self, name, *args, **kwargs):
+    def _delegate_method(self, name: str, *args, **kwargs):
         from pandas import Series
 
         method = getattr(self._parent, name)
 
@@ -113,7 +113,7 @@ def tz_to_dtype(tz: tzinfo | None, unit: str = "ns"):
         return DatetimeTZDtype(tz=tz, unit=unit)
 
 
-def _field_accessor(name: str, field: str, docstring=None):
+def _field_accessor(name: str, field: str, docstring: str | None = None):
     def f(self):
         values = self._local_timestamps()
 
 
@@ -889,7 +889,7 @@ def max(self, *, axis: AxisInt | None = None, skipna: bool = True) -> IntervalOr
         indexer = obj.argsort()[-1]
         return obj[indexer]
 
-    def fillna(self, value=None, method=None, limit=None) -> Self:
+    def fillna(self, value=None, method=None, limit: int | None = None) -> Self:
         """
         Fill NA/NaN values using the specified method.
 
 
@@ -162,7 +162,7 @@ def __getitem__(self, item: PositionalIndexer) -> Self | Any:
 
     @doc(ExtensionArray.fillna)
     @doc(ExtensionArray.fillna)
-    def fillna(self, value=None, method=None, limit=None) -> Self:
+    def fillna(self, value=None, method=None, limit: int | None = None) -> Self:
         value, method = validate_fillna_kwargs(value, method)
 
         mask = self._mask
 
@@ -98,7 +98,7 @@
 }
 
 
-def _field_accessor(name: str, docstring=None):
+def _field_accessor(name: str, docstring: str | None = None):
     def f(self):
         base = self.freq._period_dtype_code
         result = get_period_field_arr(name, self.asi8, base)
@@ -658,7 +658,7 @@ def searchsorted(
         m8arr = self._ndarray.view("M8[ns]")
         return m8arr.searchsorted(npvalue, side=side, sorter=sorter)
 
-    def fillna(self, value=None, method=None, limit=None) -> PeriodArray:
+    def fillna(self, value=None, method=None, limit: int | None = None) -> PeriodArray:
         if method is not None:
             # view as dt64 so we get treated as timelike in core.missing,
             #  similar to dtl._period_dispatch
 
@@ -46,10 +46,10 @@ def _validate(self, data):
         if not isinstance(data.dtype, SparseDtype):
             raise AttributeError(self._validation_msg)
 
-    def _delegate_property_get(self, name, *args, **kwargs):
+    def _delegate_property_get(self, name: str, *args, **kwargs):
         return getattr(self._parent.array, name)
 
-    def _delegate_method(self, name, *args, **kwargs):
+    def _delegate_method(self, name: str, *args, **kwargs):
         if name == "from_coo":
             return self.from_coo(*args, **kwargs)
         elif name == "to_coo":
Original file line number	Diff line number	Diff line change
`@@ -342,7 +342,7 @@ def validate_take_with_convert(convert: ndarray \| bool \| None, args, kwargs) ->`
`342`	`342`	`)`
`343`	`343`
`344`	`344`
`345`		`-def validate_groupby_func(name, args, kwargs, allowed=None) -> None:`
	`345`	`+def validate_groupby_func(name: str, args, kwargs, allowed=None) -> None:`
`346`	`346`	`"""`
`347`	`347`	`'args' and 'kwargs' should be empty, except for allowed kwargs because all`
`348`	`348`	`of their necessary parameters are explicitly listed in the function`
Original file line number	Diff line number	Diff line change
`@@ -1952,7 +1952,7 @@ def _str_translate(self, table):`
`1952`	`1952`	`"str.translate not supported with pd.ArrowDtype(pa.string())."`
`1953`	`1953`	`)`
`1954`	`1954`
`1955`		`- def _str_wrap(self, width, **kwargs):`
	`1955`	`+ def _str_wrap(self, width: int, **kwargs):`
`1956`	`1956`	`raise NotImplementedError(`
`1957`	`1957`	`"str.wrap not supported with pd.ArrowDtype(pa.string())."`
`1958`	`1958`	`)`