pandas-dev
diff --git a/.github/workflows/unit-tests.yml b/.github/workflows/unit-tests.yml
Lines changed: 5 additions & 0 deletions
diff --git a/README.md b/README.md
Lines changed: 1 addition & 1 deletion
diff --git a/ci/code_checks.sh b/ci/code_checks.sh
Lines changed: 0 additions & 1 deletion
diff --git a/ci/run_tests.sh b/ci/run_tests.sh
Lines changed: 6 additions & 0 deletions
diff --git a/pandas/_config/__init__.py b/pandas/_config/__init__.py
Lines changed: 1 addition & 1 deletion
diff --git a/pandas/_libs/lib.pyx b/pandas/_libs/lib.pyx
Lines changed: 2 additions & 2 deletions
diff --git a/pandas/core/config_init.py b/pandas/core/config_init.py
Lines changed: 1 addition & 1 deletion
diff --git a/pandas/core/construction.py b/pandas/core/construction.py
Lines changed: 3 additions & 7 deletions
diff --git a/pandas/core/dtypes/cast.py b/pandas/core/dtypes/cast.py
Lines changed: 2 additions & 2 deletions
diff --git a/pandas/core/dtypes/concat.py b/pandas/core/dtypes/concat.py
Lines changed: 6 additions & 0 deletions
@@ -57,6 +57,10 @@ jobs:
             # Also install zh_CN (its encoding is gb2312) but do not activate it.
             # It will be temporarily activated during tests with locale.setlocale
             extra_loc: "zh_CN"
+          - name: "Future infer strings"
+            env_file: actions-311.yaml
+            pattern: "not slow and not network and not single_cpu"
+            pandas_future_infer_string: "1"
           - name: "Pypy"
             env_file: actions-pypy-39.yaml
             pattern: "not slow and not network and not single_cpu"
@@ -75,6 +79,7 @@ jobs:
       LANG: ${{ matrix.lang || 'C.UTF-8' }}
       LC_ALL: ${{ matrix.lc_all || '' }}
       PANDAS_CI: '1'
+      PANDAS_FUTURE_INFER_STRING: ${{ matrix.pandas_future_infer_string || '0' }}
       TEST_ARGS: ${{ matrix.test_args || '' }}
       PYTEST_WORKERS: 'auto'
       PYTEST_TARGET: ${{ matrix.pytest_target || 'pandas' }}
 
@@ -96,7 +96,7 @@ The source code is currently hosted on GitHub at:
 https://github.com/pandas-dev/pandas
 
 Binary installers for the latest released version are available at the [Python
-Package Index (PyPI)](https://pypi.org/project/pandas) and on [Conda](https://docs.conda.io/en/latest/).
+Package Index (PyPI)](https://pypi.org/project/pandas) and on [Conda](https://anaconda.org/conda-forge/pandas).
 
 ```sh
 # conda
 
@@ -306,7 +306,6 @@ if [[ -z "$CHECK" || "$CHECK" == "docstrings" ]]; then
         -i "pandas.api.types.is_sparse SA01" \
         -i "pandas.api.types.is_timedelta64_ns_dtype SA01" \
         -i "pandas.api.types.pandas_dtype PR07,RT03,SA01" \
-        -i "pandas.api.types.union_categoricals RT03,SA01" \
         -i "pandas.arrays.ArrowExtensionArray PR07,SA01" \
         -i "pandas.arrays.BooleanArray SA01" \
         -i "pandas.arrays.DatetimeArray SA01" \
 
@@ -16,5 +16,11 @@ if [[ "$PATTERN" ]]; then
   PYTEST_CMD="$PYTEST_CMD -m \"$PATTERN\""
 fi
 
+# temporarily let pytest always succeed (many tests are not yet passing in the
+# build enabling the future string dtype)
+if [[ "$PANDAS_FUTURE_INFER_STRING" == "1" ]]; then
+  PYTEST_CMD="$PYTEST_CMD || true"
+fi
+
 echo $PYTEST_CMD
 sh -c "$PYTEST_CMD"
@@ -30,6 +30,6 @@
 from pandas._config.display import detect_console_encoding
 
 
-def using_pyarrow_string_dtype() -> bool:
+def using_string_dtype() -> bool:
     _mode_options = _global_config["future"]
     return _mode_options["infer_string"]
@@ -37,7 +37,7 @@ from cython cimport (
     floating,
 )
 
-from pandas._config import using_pyarrow_string_dtype
+from pandas._config import using_string_dtype
 
 from pandas._libs.missing import check_na_tuples_nonequal
 
@@ -2699,7 +2699,7 @@ def maybe_convert_objects(ndarray[object] objects,
         seen.object_ = True
 
     elif seen.str_:
-        if using_pyarrow_string_dtype() and is_string_array(objects, skipna=True):
+        if using_string_dtype() and is_string_array(objects, skipna=True):
             from pandas.core.arrays.string_ import StringDtype
 
             dtype = StringDtype(storage="pyarrow_numpy")
 
@@ -858,7 +858,8 @@ def register_converter_cb(key: str) -> None:
 with cf.config_prefix("future"):
     cf.register_option(
         "infer_string",
-        False,
+        # Default is read from the environment so a CI job can opt in ("1" enables).
+        os.environ.get("PANDAS_FUTURE_INFER_STRING", "0") == "1",
         "Whether to infer sequence of str objects as pyarrow string "
         "dtype, which will be the default in pandas 3.0 "
         "(at which point this option will be deprecated).",
 
@@ -16,7 +16,7 @@
 import numpy as np
 from numpy import ma
 
-from pandas._config import using_pyarrow_string_dtype
+from pandas._config import using_string_dtype
 
 from pandas._libs import lib
 from pandas._libs.tslibs import (
@@ -571,11 +571,7 @@ def sanitize_array(
     if not is_list_like(data):
         if index is None:
             raise ValueError("index must be specified when data is not list-like")
-        if (
-            isinstance(data, str)
-            and using_pyarrow_string_dtype()
-            and original_dtype is None
-        ):
+        if isinstance(data, str) and using_string_dtype() and original_dtype is None:
             from pandas.core.arrays.string_ import StringDtype
 
             dtype = StringDtype("pyarrow_numpy")
@@ -609,7 +605,7 @@ def sanitize_array(
             subarr = data
             if data.dtype == object and infer_object:
                 subarr = maybe_infer_to_datetimelike(data)
-            elif data.dtype.kind == "U" and using_pyarrow_string_dtype():
+            elif data.dtype.kind == "U" and using_string_dtype():
                 from pandas.core.arrays.string_ import StringDtype
 
                 dtype = StringDtype(storage="pyarrow_numpy")
 
@@ -18,7 +18,7 @@
 
 import numpy as np
 
-from pandas._config import using_pyarrow_string_dtype
+from pandas._config import using_string_dtype
 
 from pandas._libs import (
     Interval,
@@ -798,7 +798,7 @@ def infer_dtype_from_scalar(val) -> tuple[DtypeObj, Any]:
         # coming out as np.str_!
 
         dtype = _dtype_obj
-        if using_pyarrow_string_dtype():
+        if using_string_dtype():
             from pandas.core.arrays.string_ import StringDtype
 
             dtype = StringDtype(storage="pyarrow_numpy")
 
@@ -190,6 +190,7 @@ def union_categoricals(
     Returns
     -------
     Categorical
+        The union of categories being combined.
 
     Raises
     ------
@@ -201,6 +202,11 @@ def union_categoricals(
     ValueError
         Empty list of categoricals passed
 
+    See Also
+    --------
+    CategoricalDtype : Type for categorical data with the categories and orderedness.
+    Categorical : Represent a categorical variable in classic R / S-plus fashion.
+
     Notes
     -----
     To learn more about categories, see `link