DOC: factor out multiple instances of dtype_backend parameter descriptions into _shared_docs #53881


Closed · wants to merge 9 commits
12 changes: 4 additions & 8 deletions pandas/core/generic.py
@@ -6694,6 +6694,7 @@ def infer_objects(self, copy: bool_t | None = None) -> Self:
return res.__finalize__(self, method="infer_objects")

@final
@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def convert_dtypes(
self,
infer_objects: bool_t = True,
@@ -6722,13 +6723,8 @@ def convert_dtypes(
dtypes if the floats can be faithfully casted to integers.

.. versionadded:: 1.2.0
dtype_backend : {"numpy_nullable", "pyarrow"}, default "numpy_nullable"
Which dtype_backend to use, e.g. whether a DataFrame should use nullable
dtypes for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

@@ -6774,14 +6770,14 @@ def convert_dtypes(
Examples
--------
>>> df = pd.DataFrame(
... {
... {{
... "a": pd.Series([1, 2, 3], dtype=np.dtype("int32")),
... "b": pd.Series(["x", "y", "z"], dtype=np.dtype("O")),
... "c": pd.Series([True, False, np.nan], dtype=np.dtype("O")),
... "d": pd.Series(["h", "i", np.nan], dtype=np.dtype("O")),
... "e": pd.Series([10, np.nan, 20], dtype=np.dtype("float")),
... "f": pd.Series([np.nan, 100.5, 200], dtype=np.dtype("float")),
... }
... }}
... )

Start with a DataFrame with default dtypes.
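A note on the `{{`/`}}` doubling this hunk introduces in the doctest: once a docstring goes through `@doc`, it is treated as a `str.format`-style template, so any literal brace in example code has to be escaped or the substitution fails. A minimal sketch of the formatting behavior the escaping has to survive (plain `str.format`; names are illustrative):

# Docstring template as @doc sees it: "{dtype_backend_options}" is a
# placeholder, while the doubled braces protect the dict literal.
template = """Examples
--------
>>> df = pd.DataFrame({{"a": [1, 2, 3]}})

{dtype_backend_options}
"""

rendered = template.format(dtype_backend_options="dtype_backend : ...")
print(rendered)
# >>> df = pd.DataFrame({"a": [1, 2, 3]})   # braces back to single
# dtype_backend : ...                       # shared text substituted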
9 changes: 9 additions & 0 deletions pandas/core/shared_docs.py
@@ -489,6 +489,15 @@
.. versionadded:: 1.5.0
Added support for `.tar` files."""

_shared_docs[
"dtype_backend_options"
] = """dtype_backend : {'numpy_nullable', 'pyarrow'}, default NumPy-backed DataFrame
Back-end data type to use. ``'numpy_nullable'`` denotes NumPy-backed arrays where
nullable dtypes are used for all data types that have a nullable implementation.
``'pyarrow'`` specifies using PyArrow for all data types.

These back-ends are still experimental."""

_shared_docs[
"replace"
] = """
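For readers skimming the diff: `pandas.util._decorators.doc` consumes these `_shared_docs` entries by formatting the keyword arguments into the decorated function's docstring. A self-contained sketch of the pattern (a simplified stand-in, not the real decorator, which also dedents and can compose several docstrings; `read_thing` is hypothetical):

_shared_docs = {
    "dtype_backend_options": (
        "dtype_backend : {'numpy_nullable', 'pyarrow'}\n"
        "        Back-end data type to use."
    ),
}

def doc(**params):
    # Simplified stand-in for pandas.util._decorators.doc: substitute
    # {placeholders} in the wrapped function's docstring.
    def decorator(func):
        func.__doc__ = func.__doc__.format(**params)
        return func
    return decorator

@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def read_thing(path, dtype_backend="numpy_nullable"):
    """Read a thing (hypothetical reader).

    Parameters
    ----------
    {dtype_backend_options}
    """

print(read_thing.__doc__)  # the shared description appears inline, once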
13 changes: 5 additions & 8 deletions pandas/core/tools/numeric.py
@@ -8,6 +8,7 @@
import numpy as np

from pandas._libs import lib
from pandas.util._decorators import doc
from pandas.util._validators import check_dtype_backend

from pandas.core.dtypes.cast import maybe_downcast_numeric
@@ -30,6 +31,7 @@

from pandas.core.arrays import BaseMaskedArray
from pandas.core.arrays.string_ import StringDtype
from pandas.core.shared_docs import _shared_docs

if TYPE_CHECKING:
from pandas._typing import (
@@ -39,6 +41,7 @@
)


@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def to_numeric(
arg,
errors: DateTimeErrorChoices = "raise",
@@ -64,7 +67,7 @@ def to_numeric(
----------
arg : scalar, list, tuple, 1-d array, or Series
Argument to be converted.
errors : {'ignore', 'raise', 'coerce'}, default 'raise'
errors : {{'ignore', 'raise', 'coerce'}}, default 'raise'
- If 'raise', then invalid parsing will raise an exception.
- If 'coerce', then invalid parsing will be set as NaN.
- If 'ignore', then invalid parsing will return the input.
@@ -88,13 +91,7 @@
the dtype it is to be cast to, so if none of the dtypes
checked satisfy that specification, no downcasting will be
performed on the data.
dtype_backend : {"numpy_nullable", "pyarrow"}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

11 changes: 4 additions & 7 deletions pandas/io/clipboards.py
@@ -6,6 +6,7 @@
import warnings

from pandas._libs import lib
from pandas.util._decorators import doc
from pandas.util._exceptions import find_stack_level
from pandas.util._validators import check_dtype_backend

@@ -15,11 +16,13 @@
get_option,
option_context,
)
from pandas.core.shared_docs import _shared_docs

if TYPE_CHECKING:
from pandas._typing import DtypeBackend


@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def read_clipboard(
sep: str = r"\s+",
dtype_backend: DtypeBackend | lib.NoDefault = lib.no_default,
@@ -37,13 +40,7 @@ def read_clipboard(
A string or regex delimiter. The default of ``'\\s+'`` denotes
one or more whitespace characters.

dtype_backend : {"numpy_nullable", "pyarrow"}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g., whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when ``'numpy_nullable'`` is set, pyarrow is used for all
dtypes if ``'pyarrow'`` is set.

The dtype_backends are still experimental.
{dtype_backend_options}

.. versionadded:: 2.0

13 changes: 5 additions & 8 deletions pandas/io/excel/_base.py
@@ -285,13 +285,7 @@

.. versionadded:: 1.2.0

dtype_backend : {{"numpy_nullable", "pyarrow"}}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

@@ -451,7 +445,10 @@ def read_excel(
...


@doc(storage_options=_shared_docs["storage_options"])
@doc(
storage_options=_shared_docs["storage_options"],
dtype_backend_options=_shared_docs["dtype_backend_options"],
)
@Appender(_read_excel_doc)
def read_excel(
io,
13 changes: 5 additions & 8 deletions pandas/io/feather_format.py
@@ -62,7 +62,10 @@ def to_feather(
feather.write_feather(df, handles.handle, **kwargs)


@doc(storage_options=_shared_docs["storage_options"])
@doc(
storage_options=_shared_docs["storage_options"],
dtype_backend_options=_shared_docs["dtype_backend_options"],
)
def read_feather(
path: FilePath | ReadBuffer[bytes],
columns: Sequence[Hashable] | None = None,
@@ -88,13 +91,7 @@ def read_feather(

.. versionadded:: 1.2.0

dtype_backend : {{"numpy_nullable", "pyarrow"}}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

29 changes: 13 additions & 16 deletions pandas/io/html.py
@@ -25,6 +25,7 @@
AbstractMethodError,
EmptyDataError,
)
from pandas.util._decorators import doc
from pandas.util._exceptions import find_stack_level
from pandas.util._validators import check_dtype_backend

@@ -34,6 +35,7 @@
from pandas.core.indexes.base import Index
from pandas.core.indexes.multi import MultiIndex
from pandas.core.series import Series
from pandas.core.shared_docs import _shared_docs

from pandas.io.common import (
file_exists,
@@ -352,13 +354,13 @@ def _parse_tfoot_tr(self, table):
"""
raise AbstractMethodError(self)

def _parse_tables(self, doc, match, attrs):
def _parse_tables(self, dom_doc, match, attrs):
Member:
this seems irrelevant (and I don't know if it affects anyone who might be subclassing) - can we revert this please?

Contributor Author:
Thanks for the suggestion. I made this change because I thought there was a conflict between the `doc` parameter in `_parse_tables` and the `@doc` decorator being applied, but now that you've suggested going in and changing each instance anyway, this rename will certainly be reverted along with the others, so no worries there.
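For what it's worth, a parameter named `doc` shadows the imported decorator only inside the function body, so module-level `@doc(...)` applications keep resolving either way; a quick illustration of the scoping rule, with stand-in values:

doc = "imported decorator (module-level binding)"

def _parse_tables(self, doc, match, attrs):
    # Inside this body, `doc` refers to the parameter, not the import.
    return doc

print(_parse_tables(None, "a parsed DOM", None, None))  # "a parsed DOM"
print(doc)  # the module-level binding is untouched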

"""
Return all tables from the parsed DOM.

Parameters
----------
doc : the DOM from which to parse the table element.
dom_doc : the DOM from which to parse the table element.

match : str or regular expression
The text to search for in the DOM tree.
Expand Down Expand Up @@ -583,9 +585,9 @@ def __init__(self, *args, **kwargs) -> None:

self._strainer = SoupStrainer("table")

def _parse_tables(self, doc, match, attrs):
def _parse_tables(self, dom_doc, match, attrs):
element_name = self._strainer.name
tables = doc.find_all(element_name, attrs=attrs)
tables = dom_doc.find_all(element_name, attrs=attrs)
if not tables:
raise ValueError("No tables found")

@@ -715,7 +717,7 @@ def _parse_td(self, row):
# <thead> or <tfoot> (see _parse_thead_tr).
return row.xpath("./td|./th")

def _parse_tables(self, doc, match, kwargs):
def _parse_tables(self, dom_doc, match, kwargs):
pattern = match.pattern

# 1. check all descendants for the given pattern and only search tables
@@ -727,7 +729,7 @@ def _parse_tables(self, doc, match, kwargs):
if kwargs:
xpath_expr += _build_xpath_expr(kwargs)

tables = doc.xpath(xpath_expr, namespaces=_re_namespace)
tables = dom_doc.xpath(xpath_expr, namespaces=_re_namespace)

tables = self._handle_hidden_tables(tables, "attrib")
if self.displayed_only:
@@ -995,6 +997,7 @@ def _parse(flavor, io, match, attrs, encoding, displayed_only, extract_links, **
return ret


@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def read_html(
io: FilePath | ReadBuffer[str],
*,
@@ -1064,13 +1067,13 @@ def read_html(
passed to lxml or Beautiful Soup. However, these attributes must be
valid HTML table attributes to work correctly. For example, ::

attrs = {'id': 'table'}
attrs = {{'id': 'table'}}

is a valid attribute dictionary because the 'id' HTML tag attribute is
a valid HTML attribute for *any* HTML tag as per `this document
<https://html.spec.whatwg.org/multipage/dom.html#global-attributes>`__. ::

attrs = {'asdf': 'table'}
attrs = {{'asdf': 'table'}}

is *not* a valid attribute dictionary because 'asdf' is not a valid
HTML attribute even if it is a valid XML attribute. Valid HTML 4.01
@@ -1112,19 +1115,13 @@ def read_html(
displayed_only : bool, default True
Whether elements with "display: none" should be parsed.

extract_links : {None, "all", "header", "body", "footer"}
extract_links : {{None, "all", "header", "body", "footer"}}
Table elements in the specified section(s) with <a> tags will have their
href extracted.

.. versionadded:: 1.5.0

dtype_backend : {"numpy_nullable", "pyarrow"}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

9 changes: 2 additions & 7 deletions pandas/io/json/_json.py
@@ -496,6 +496,7 @@ def read_json(


@doc(
dtype_backend_options=_shared_docs["dtype_backend_options"],
storage_options=_shared_docs["storage_options"],
decompression_options=_shared_docs["decompression_options"] % "path_or_buf",
)
@@ -660,13 +661,7 @@ def read_json(

.. versionadded:: 1.2.0

dtype_backend : {{"numpy_nullable", "pyarrow"}}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

11 changes: 4 additions & 7 deletions pandas/io/orc.py
@@ -12,6 +12,7 @@
from pandas._libs import lib
from pandas.compat import pa_version_under8p0
from pandas.compat._optional import import_optional_dependency
from pandas.util._decorators import doc
from pandas.util._validators import check_dtype_backend

from pandas.core.dtypes.common import is_unsigned_integer_dtype
@@ -23,6 +24,7 @@

import pandas as pd
from pandas.core.indexes.api import default_index
from pandas.core.shared_docs import _shared_docs

from pandas.io.common import (
get_handle,
@@ -40,6 +42,7 @@
from pandas.core.frame import DataFrame


@doc(dtype_backend_options=_shared_docs["dtype_backend_options"])
def read_orc(
path: FilePath | ReadBuffer[bytes],
columns: list[str] | None = None,
@@ -63,13 +66,7 @@ def read_orc(
Output always follows the ordering of the file and not the columns list.
This mirrors the original behaviour of
:external+pyarrow:py:meth:`pyarrow.orc.ORCFile.read`.
dtype_backend : {"numpy_nullable", "pyarrow"}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

13 changes: 5 additions & 8 deletions pandas/io/parquet.py
@@ -478,7 +478,10 @@ def to_parquet(
return None


@doc(storage_options=_shared_docs["storage_options"])
@doc(
dtype_backend_options=_shared_docs["dtype_backend_options"],
storage_options=_shared_docs["storage_options"],
)
def read_parquet(
path: FilePath | ReadBuffer[bytes],
engine: str = "auto",
@@ -533,13 +536,7 @@ def read_parquet(

.. deprecated:: 2.0

dtype_backend : {{"numpy_nullable", "pyarrow"}}, defaults to NumPy backed DataFrames
Which dtype_backend to use, e.g. whether a DataFrame should have NumPy
arrays, nullable dtypes are used for all dtypes that have a nullable
implementation when "numpy_nullable" is set, pyarrow is used for all
dtypes if "pyarrow" is set.

The dtype_backends are still experimential.
{dtype_backend_options}

.. versionadded:: 2.0

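A quick way to sanity-check the refactor, assuming a build with this branch installed: each reader should now render the one shared fragment rather than a hand-copied variant, with no raw placeholder leaking through:

import pandas as pd

for func in (pd.read_parquet, pd.read_orc, pd.read_feather, pd.to_numeric):
    # The shared description was substituted into the docstring...
    assert "numpy_nullable" in func.__doc__
    # ...and the template placeholder did not survive unformatted.
    assert "{dtype_backend_options}" not in func.__doc__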