pandas-dev
diff --git a/Diff for: ‎.github/workflows/comment-commands.yml
+4-6 b/Diff for: ‎.github/workflows/comment-commands.yml
+4-6
diff --git a/Diff for: ‎.github/workflows/docbuild-and-upload.yml
-7 b/Diff for: ‎.github/workflows/docbuild-and-upload.yml
-7
diff --git a/Diff for: ‎.github/workflows/unit-tests.yml
-12 b/Diff for: ‎.github/workflows/unit-tests.yml
-12
diff --git a/Diff for: ‎.pre-commit-config.yaml
-2 b/Diff for: ‎.pre-commit-config.yaml
-2
diff --git a/Diff for: ‎asv_bench/asv.conf.json
+1-1 b/Diff for: ‎asv_bench/asv.conf.json
+1-1
diff --git a/Diff for: ‎asv_bench/benchmarks/algos/isin.py
+2-1 b/Diff for: ‎asv_bench/benchmarks/algos/isin.py
+2-1
diff --git a/Diff for: ‎asv_bench/benchmarks/frame_methods.py
-2 b/Diff for: ‎asv_bench/benchmarks/frame_methods.py
-2
diff --git a/Diff for: ‎asv_bench/benchmarks/strings.py
+2-1 b/Diff for: ‎asv_bench/benchmarks/strings.py
+2-1
diff --git a/Diff for: ‎ci/code_checks.sh
+2-4 b/Diff for: ‎ci/code_checks.sh
+2-4
diff --git a/Diff for: ‎doc/source/reference/arrays.rst
+15 b/Diff for: ‎doc/source/reference/arrays.rst
+15
diff --git a/Diff for: ‎doc/source/reference/groupby.rst
-2 b/Diff for: ‎doc/source/reference/groupby.rst
-2
diff --git a/Diff for: ‎doc/source/reference/index.rst
+4-3 b/Diff for: ‎doc/source/reference/index.rst
+4-3
diff --git a/Diff for: ‎doc/source/user_guide/groupby.rst
+1-1 b/Diff for: ‎doc/source/user_guide/groupby.rst
+1-1
diff --git a/Diff for: ‎doc/source/whatsnew/v2.0.0.rst
+1-1 b/Diff for: ‎doc/source/whatsnew/v2.0.0.rst
+1-1
diff --git a/Diff for: ‎doc/source/whatsnew/v2.2.1.rst
+2 b/Diff for: ‎doc/source/whatsnew/v2.2.1.rst
+2
diff --git a/Diff for: ‎doc/source/whatsnew/v3.0.0.rst
+4 b/Diff for: ‎doc/source/whatsnew/v3.0.0.rst
+4
diff --git a/Diff for: ‎environment.yml
+1-1 b/Diff for: ‎environment.yml
+1-1
diff --git a/Diff for: ‎pandas/__init__.py
+1-12 b/Diff for: ‎pandas/__init__.py
+1-12
diff --git a/Diff for: ‎pandas/_config/__init__.py
+2-10 b/Diff for: ‎pandas/_config/__init__.py
+2-10
diff --git a/Diff for: ‎pandas/_typing.py
+1-7 b/Diff for: ‎pandas/_typing.py
+1-7
diff --git a/Diff for: ‎pandas/conftest.py
+2-10 b/Diff for: ‎pandas/conftest.py
+2-10
diff --git a/Diff for: ‎pandas/core/apply.py
+2-2 b/Diff for: ‎pandas/core/apply.py
+2-2
diff --git a/Diff for: ‎pandas/core/arraylike.py
+2-5 b/Diff for: ‎pandas/core/arraylike.py
+2-5
diff --git a/Diff for: ‎pandas/core/arrays/base.py
+1-1 b/Diff for: ‎pandas/core/arrays/base.py
+1-1
@@ -24,12 +24,10 @@ jobs:
     concurrency:
       group: ${{ github.actor }}-preview-docs
     steps:
-      - run: |
-          if curl --output /dev/null --silent --head --fail "https://pandas.pydata.org/preview/${{ github.event.issue.number }}/"; then
-            curl -H "Authorization: token ${{ secrets.GITHUB_TOKEN }}" -d '{"body": "Website preview of this PR available at: https://pandas.pydata.org/preview/${{ github.event.issue.number }}/"}' https://api.github.com/repos/${{ github.repository }}/issues/${{ github.event.issue.number }}/comments
-          else
-            curl -H "Authorization: token ${{ secrets.GITHUB_TOKEN }}" -d '{"body": "No preview found for PR #${{ github.event.issue.number }}. Did the docs build complete?"}' https://api.github.com/repos/${{ github.repository }}/issues/${{ github.event.issue.number }}/comments
-          fi
+      - uses: pandas-dev/github-doc-previewer@master
+        with:
+          previewer-server: "https://pandas.pydata.org/preview"
+          artifact-job: "Doc Build and Upload"
   asv_run:
     runs-on: ubuntu-22.04
     # TODO: Support more benchmarking options later, against different branches, against self, etc
 
@@ -90,10 +90,3 @@ jobs:
         name: website
         path: web/build
         retention-days: 14
-
-    - name: Trigger web/doc preview
-      run: curl -X POST https://pandas.pydata.org/preview/submit/$RUN_ID/$PR_ID/
-      env:
-        RUN_ID: ${{ github.run_id }}
-        PR_ID: ${{ github.event.pull_request.number }}
-      if: github.event_name == 'pull_request'
@@ -73,18 +73,6 @@ jobs:
             env_file: actions-312.yaml
             pattern: "not slow and not network and not single_cpu"
             pandas_copy_on_write: "1"
-          - name: "Copy-on-Write 3.11 (warnings)"
-            env_file: actions-311.yaml
-            pattern: "not slow and not network and not single_cpu"
-            pandas_copy_on_write: "warn"
-          - name: "Copy-on-Write 3.10 (warnings)"
-            env_file: actions-310.yaml
-            pattern: "not slow and not network and not single_cpu"
-            pandas_copy_on_write: "warn"
-          - name: "Copy-on-Write 3.9 (warnings)"
-            env_file: actions-39.yaml
-            pattern: "not slow and not network and not single_cpu"
-            pandas_copy_on_write: "warn"
           - name: "Pypy"
             env_file: actions-pypy-39.yaml
             pattern: "not slow and not network and not single_cpu"
 
@@ -101,8 +101,6 @@ repos:
 -   repo: https://github.com/pre-commit/pygrep-hooks
     rev: v1.10.0
     hooks:
-      - id: python-check-blanket-noqa
-      - id: python-check-blanket-type-ignore
       - id: rst-backticks
       - id: rst-directive-colons
         types: [text]  # overwrite types: [rst]
 
@@ -41,7 +41,7 @@
     // pip (with all the conda available packages installed first,
     // followed by the pip installed packages).
     "matrix": {
-        "Cython": ["3.0.5"],
+        "Cython": ["3.0"],
         "matplotlib": [],
         "sqlalchemy": [],
         "scipy": [],
 
@@ -59,7 +59,8 @@ def setup(self, dtype):
         elif dtype in ["str", "string[python]", "string[pyarrow]"]:
             try:
                 self.series = Series(
-                    Index([f"i-{i}" for i in range(N)], dtype=object), dtype=dtype
+                    Index([f"i-{i}" for i in range(N)], dtype=object)._values,
+                    dtype=dtype,
                 )
             except ImportError as err:
                 raise NotImplementedError from err
 
@@ -593,8 +593,6 @@ def setup(self):
         N = 10000
         # this is the worst case, where every column has NaNs.
         arr = np.random.randn(N, 100)
-        # NB: we need to set values in array, not in df.values, otherwise
-        #  the benchmark will be misleading for ArrayManager
         arr[::2] = np.nan
 
         self.df = DataFrame(arr)
 
@@ -19,7 +19,8 @@ class Dtypes:
     def setup(self, dtype):
         try:
             self.s = Series(
-                Index([f"i-{i}" for i in range(10000)], dtype=object), dtype=dtype
+                Index([f"i-{i}" for i in range(10000)], dtype=object)._values,
+                dtype=dtype,
             )
         except ImportError as err:
             raise NotImplementedError from err
 
@@ -93,7 +93,6 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
         pandas.TimedeltaIndex.ceil\
         pandas.PeriodIndex\
         pandas.PeriodIndex.strftime\
-        pandas.Series.clip\
         pandas.Series.rename_axis\
         pandas.Series.dt.to_period\
         pandas.Series.dt.tz_localize\
@@ -115,7 +114,6 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
         pandas.Series.plot.barh\
         pandas.Series.plot.line\
         pandas.Series.plot.pie\
-        pandas.DataFrame.clip\
         pandas.DataFrame.plot\
         pandas.DataFrame.plot.bar\
         pandas.DataFrame.plot.barh\
@@ -181,10 +179,10 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
         pandas.core.groupby.SeriesGroupBy.rolling\
         pandas.core.groupby.DataFrameGroupBy.hist\
         pandas.core.groupby.DataFrameGroupBy.plot\
+        pandas.core.groupby.DataFrameGroupBy.corrwith\
         pandas.core.groupby.SeriesGroupBy.plot\
         pandas.core.window.rolling.Rolling.quantile\
-        pandas.core.window.expanding.Expanding.quantile\
-        pandas.api.extensions.ExtensionArray.argsort # There should be no backslash in the final line, please keep this comment in the last ignored function
+        pandas.core.window.expanding.Expanding.quantile # There should be no backslash in the final line, please keep this comment in the last ignored function
     RET=$(($RET + $?)) ; echo $MSG "DONE"
 
 fi
 
@@ -539,6 +539,21 @@ To create a Series of dtype ``category``, use ``cat = s.astype(dtype)`` or
 If the :class:`Series` is of dtype :class:`CategoricalDtype`, ``Series.cat`` can be used to change the categorical
 data. See :ref:`api.series.cat` for more.
 
+More methods are available on :class:`Categorical`:
+
+.. autosummary::
+   :toctree: api/
+
+   Categorical.as_ordered
+   Categorical.as_unordered
+   Categorical.set_categories
+   Categorical.rename_categories
+   Categorical.reorder_categories
+   Categorical.add_categories
+   Categorical.remove_categories
+   Categorical.remove_unused_categories
+   Categorical.map
+
 .. _api.arrays.sparse:
 
 Sparse
 
@@ -80,7 +80,6 @@ Function application
    DataFrameGroupBy.describe
    DataFrameGroupBy.diff
    DataFrameGroupBy.ffill
-   DataFrameGroupBy.fillna
    DataFrameGroupBy.first
    DataFrameGroupBy.head
    DataFrameGroupBy.idxmax
@@ -131,7 +130,6 @@ Function application
    SeriesGroupBy.describe
    SeriesGroupBy.diff
    SeriesGroupBy.ffill
-   SeriesGroupBy.fillna
    SeriesGroupBy.first
    SeriesGroupBy.head
    SeriesGroupBy.last
 
@@ -24,13 +24,14 @@ The following subpackages are public.
   `pandas-stubs <https://github.com/pandas-dev/pandas-stubs>`_ package
   which has classes in addition to those that occur in pandas for type-hinting.
 
-In addition, public functions in ``pandas.io`` and ``pandas.tseries`` submodules
-are mentioned in the documentation.
+In addition, public functions in ``pandas.io``, ``pandas.tseries``, and ``pandas.util`` submodules
+are explicitly mentioned in the documentation. Further APIs in these modules are not guaranteed
+to be stable.
 
 
 .. warning::
 
-    The ``pandas.core``, ``pandas.compat``, and ``pandas.util`` top-level modules are PRIVATE. Stable functionality in such modules is not guaranteed.
+    The ``pandas.core`` and ``pandas.compat`` top-level modules are PRIVATE. Stable functionality in such modules is not guaranteed.
 
 .. If you update this toctree, also update the manual toctree in the
 .. main index.rst.template
 
@@ -289,7 +289,7 @@ the number of groups, which is the same as the length of the ``groups`` dictiona
    In [1]: gb.<TAB>  # noqa: E225, E999
    gb.agg        gb.boxplot    gb.cummin     gb.describe   gb.filter     gb.get_group  gb.height     gb.last       gb.median     gb.ngroups    gb.plot       gb.rank       gb.std        gb.transform
    gb.aggregate  gb.count      gb.cumprod    gb.dtype      gb.first      gb.groups     gb.hist       gb.max        gb.min        gb.nth        gb.prod       gb.resample   gb.sum        gb.var
-   gb.apply      gb.cummax     gb.cumsum     gb.fillna     gb.gender     gb.head       gb.indices    gb.mean       gb.name       gb.ohlc       gb.quantile   gb.size       gb.tail       gb.weight
+   gb.apply      gb.cummax     gb.cumsum     gb.gender     gb.head       gb.indices    gb.mean       gb.name       gb.ohlc       gb.quantile   gb.size       gb.tail       gb.weight
 
 .. _groupby.multiindex:
 
 
@@ -732,7 +732,7 @@ or, if your formats are all ISO8601 (but possibly not identically-formatted) ::
 
 Other API changes
 ^^^^^^^^^^^^^^^^^
-- The ``freq``, ``tz``, ``nanosecond``, and ``unit`` keywords in the :class:`Timestamp` constructor are now keyword-only (:issue:`45307`, :issue:`32526`)
+- The ``tz``, ``nanosecond``, and ``unit`` keywords in the :class:`Timestamp` constructor are now keyword-only (:issue:`45307`, :issue:`32526`)
 - Passing ``nanoseconds`` greater than 999 or less than 0 in :class:`Timestamp` now raises a ``ValueError`` (:issue:`48538`, :issue:`48255`)
 - :func:`read_csv`: specifying an incorrect number of columns with ``index_col`` of now raises ``ParserError`` instead of ``IndexError`` when using the c parser.
 - Default value of ``dtype`` in :func:`get_dummies` is changed to ``bool`` from ``uint8`` (:issue:`45848`)
 
@@ -18,6 +18,7 @@ Fixed regressions
 - Fixed regression in :func:`merge_ordered` raising ``TypeError`` for ``fill_method="ffill"`` and ``how="left"`` (:issue:`57010`)
 - Fixed regression in :func:`wide_to_long` raising an ``AttributeError`` for string columns (:issue:`57066`)
 - Fixed regression in :meth:`DataFrame.loc` raising ``IndexError`` for non-unique, masked dtype indexes where result has more than 10,000 rows (:issue:`57027`)
+- Fixed regression in :meth:`DataFrame.sort_index` not producing a stable sort for an index with duplicates (:issue:`57151`)
 - Fixed regression in :meth:`DataFrame.to_dict` with ``orient='list'`` and datetime or timedelta types returning integers (:issue:`54824`)
 - Fixed regression in :meth:`DataFrameGroupBy.idxmin`, :meth:`DataFrameGroupBy.idxmax`, :meth:`SeriesGroupBy.idxmin`, :meth:`SeriesGroupBy.idxmax` ignoring the ``skipna`` argument (:issue:`57040`)
 - Fixed regression in :meth:`DataFrameGroupBy.idxmin`, :meth:`DataFrameGroupBy.idxmax`, :meth:`SeriesGroupBy.idxmin`, :meth:`SeriesGroupBy.idxmax` where values containing the minimum or maximum value for the dtype could produce incorrect results (:issue:`57040`)
@@ -29,6 +30,7 @@ Fixed regressions
 
 Bug fixes
 ~~~~~~~~~
+- Fixed bug in :func:`pandas.api.interchange.from_dataframe` which was raising for empty inputs (:issue:`56700`)
 - Fixed bug in :meth:`DataFrame.__getitem__` for empty :class:`DataFrame` with Copy-on-Write enabled (:issue:`57130`)
 
 .. ---------------------------------------------------------------------------
 
@@ -101,7 +101,11 @@ Deprecations
 
 Removal of prior version deprecations/changes
 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+- Removed :meth:`DataFrameGroupBy.fillna` and :meth:`SeriesGroupBy.fillna` (:issue:`55719`)
+- Removed ``axis`` argument from all groupby operations (:issue:`50405`)
 - Removed deprecated argument ``obj`` in :meth:`.DataFrameGroupBy.get_group` and :meth:`.SeriesGroupBy.get_group` (:issue:`53545`)
+- Removed the ``ArrayManager`` (:issue:`55043`)
+-
 
 .. ---------------------------------------------------------------------------
 .. _whatsnew_300.performance:
 
@@ -8,7 +8,7 @@ dependencies:
 
   # build dependencies
   - versioneer[toml]
-  - cython=3.0.5
+  - cython~=3.0.5
   - meson[ninja]=1.2.1
   - meson-python=0.13.1
 
 
@@ -1,6 +1,5 @@
 from __future__ import annotations
 
-import os
 import warnings
 
 __docformat__ = "restructuredtext"
@@ -193,16 +192,6 @@
     __git_version__ = v.get("full-revisionid")
     del get_versions, v
 
-# GH#55043 - deprecation of the data_manager option
-if "PANDAS_DATA_MANAGER" in os.environ:
-    warnings.warn(
-        "The env variable PANDAS_DATA_MANAGER is set. The data_manager option is "
-        "deprecated and will be removed in a future version. Only the BlockManager "
-        "will be available. Unset this environment variable to silence this warning.",
-        FutureWarning,
-        stacklevel=2,
-    )
-
 # DeprecationWarning for missing pyarrow
 from pandas.compat.pyarrow import pa_version_under10p1, pa_not_found
 
@@ -232,7 +221,7 @@
     del VERSIONS, pa_msg
 
 # Delete all unnecessary imported modules
-del pa_version_under10p1, pa_not_found, warnings, os
+del pa_version_under10p1, pa_not_found, warnings
 
 # module level doc-string
 __doc__ = """
 
@@ -32,19 +32,11 @@
 
 
 def using_copy_on_write() -> bool:
-    _mode_options = _global_config["mode"]
-    return (
-        _mode_options["copy_on_write"] is True
-        and _mode_options["data_manager"] == "block"
-    )
+    return True
 
 
 def warn_copy_on_write() -> bool:
-    _mode_options = _global_config["mode"]
-    return (
-        _mode_options["copy_on_write"] == "warn"
-        and _mode_options["data_manager"] == "block"
-    )
+    return False
 
 
 def using_nullable_dtypes() -> bool:
 
@@ -61,9 +61,7 @@
     )
     from pandas.core.indexes.base import Index
     from pandas.core.internals import (
-        ArrayManager,
         BlockManager,
-        SingleArrayManager,
         SingleBlockManager,
     )
     from pandas.core.resample import Resampler
@@ -382,11 +380,7 @@ def closed(self) -> bool:
 ]
 
 # internals
-Manager = Union[
-    "ArrayManager", "SingleArrayManager", "BlockManager", "SingleBlockManager"
-]
-SingleManager = Union["SingleArrayManager", "SingleBlockManager"]
-Manager2D = Union["ArrayManager", "BlockManager"]
+Manager = Union["BlockManager", "SingleBlockManager"]
 
 # indexing
 # PositionalIndexer -> valid 1D positional indexer, e.g. can pass
 
@@ -48,8 +48,6 @@
     utc,
 )
 
-from pandas._config.config import _get_option
-
 import pandas.util._test_decorators as td
 
 from pandas.core.dtypes.dtypes import (
@@ -1965,21 +1963,15 @@ def using_copy_on_write() -> bool:
     """
     Fixture to check if Copy-on-Write is enabled.
     """
-    return (
-        pd.options.mode.copy_on_write is True
-        and _get_option("mode.data_manager", silent=True) == "block"
-    )
+    return True
 
 
 @pytest.fixture
 def warn_copy_on_write() -> bool:
     """
     Fixture to check if Copy-on-Write is in warning mode.
     """
-    return (
-        pd.options.mode.copy_on_write == "warn"
-        and _get_option("mode.data_manager", silent=True) == "block"
-    )
+    return False
 
 
 @pytest.fixture
 
@@ -1256,7 +1256,7 @@ def series_generator(self) -> Generator[Series, None, None]:
         ser = self.obj._ixs(0, axis=0)
         mgr = ser._mgr
 
-        is_view = mgr.blocks[0].refs.has_reference()  # type: ignore[union-attr]
+        is_view = mgr.blocks[0].refs.has_reference()
 
         if isinstance(ser.dtype, ExtensionDtype):
             # values will be incorrect for this block
@@ -1278,7 +1278,7 @@ def series_generator(self) -> Generator[Series, None, None]:
                     # -> if that happened and `ser` is already a copy, then we reset
                     # the refs here to avoid triggering a unnecessary CoW inside the
                     # applied function (https://github.com/pandas-dev/pandas/pull/56212)
-                    mgr.blocks[0].refs = BlockValuesRefs(mgr.blocks[0])  # type: ignore[union-attr]
+                    mgr.blocks[0].refs = BlockValuesRefs(mgr.blocks[0])
                 yield ser
 
     @staticmethod
 
@@ -263,10 +263,7 @@ def array_ufunc(self, ufunc: np.ufunc, method: str, *inputs: Any, **kwargs: Any)
         Series,
     )
     from pandas.core.generic import NDFrame
-    from pandas.core.internals import (
-        ArrayManager,
-        BlockManager,
-    )
+    from pandas.core.internals import BlockManager
 
     cls = type(self)
 
@@ -350,7 +347,7 @@ def _reconstruct(result):
             if method == "outer":
                 raise NotImplementedError
             return result
-        if isinstance(result, (BlockManager, ArrayManager)):
+        if isinstance(result, BlockManager):
             # we went through BlockManager.apply e.g. np.sqrt
             result = self._constructor_from_mgr(result, axes=result.axes)
         else:
 
@@ -818,7 +818,7 @@ def argsort(
         na_position : {'first', 'last'}, default 'last'
             If ``'first'``, put ``NaN`` values at the beginning.
             If ``'last'``, put ``NaN`` values at the end.
-        *args, **kwargs:
+        **kwargs
             Passed through to :func:`numpy.argsort`.
 
         Returns