Revert to a doc update

rhshadrach · rhshadrach · commit 29295627e1a2 · 2025-07-13T08:46:55.000-04:00
diff --git a/pandas/core/reshape/encoding.py b/pandas/core/reshape/encoding.py
@@ -17,14 +17,12 @@
     is_integer_dtype,
     is_list_like,
     is_object_dtype,
-    is_string_dtype,
     pandas_dtype,
 )
 from pandas.core.dtypes.dtypes import (
     ArrowDtype,
     CategoricalDtype,
 )
-from pandas.core.dtypes.missing import isna
 
 from pandas.core.arrays import SparseArray
 from pandas.core.arrays.categorical import factorize_from_iterable
@@ -38,7 +36,6 @@
 
 if TYPE_CHECKING:
     from pandas._typing import (
-        DtypeObj,
         NpDtype,
     )
 
@@ -395,7 +392,9 @@ def from_dummies(
         The default category is the implied category when a value has none of the
         listed categories specified with a one, i.e. if all dummies in a row are
         zero. Can be a single value for all variables or a dict directly mapping
-        the default categories to a prefix of a variable.
+        the default categories to a prefix of a variable. The default category
+        is coerced to the dtype of ``data.columns`` when that coercion is
+        lossless; otherwise an error is raised.
 
     Returns
     -------
@@ -560,20 +559,9 @@ def from_dummies(
                 "Dummy DataFrame contains multi-assignment(s); "
                 f"First instance in row: {assigned.idxmax()}"
             )
-        dtype: str | DtypeObj = data.columns.dtype
         if any(assigned == 0):
             if isinstance(default_category, dict):
-                value = default_category[prefix]
-                if (
-                    is_string_dtype(data.columns.dtype)
-                    and not isinstance(value, str)
-                    and (is_list_like(value) or not isna(value))
-                ):
-                    # https://github.com/pandas-dev/pandas/pull/60694
-                    # `value` is not a string or NA.
-                    # Using data.columns.dtype would coerce `value` into a string.
-                    dtype = "object"
-                cats.append(value)
+                cats.append(default_category[prefix])
             else:
                 raise ValueError(
                     "Dummy DataFrame contains unassigned value(s); "
@@ -584,7 +572,8 @@ def from_dummies(
             )
         else:
             data_slice = data_to_decode.loc[:, prefix_slice]
-        cats_array = data._constructor_sliced(cats, dtype=dtype)
+        # Build with the columns' dtype so the default category is coerced to it.
+        cats_array = data._constructor_sliced(cats, dtype=data.columns.dtype)
         # get indices of True entries along axis=1
         true_values = data_slice.idxmax(axis=1)
         indexer = data_slice.columns.get_indexer_for(true_values)
diff --git a/pandas/tests/reshape/test_from_dummies.py b/pandas/tests/reshape/test_from_dummies.py
@@ -1,7 +1,6 @@
 import numpy as np
 import pytest
 
-import pandas as pd
 from pandas import (
     DataFrame,
     Series,
@@ -334,7 +333,7 @@ def test_no_prefix_string_cats_default_category(
 ):
     dummies = DataFrame({"a": [1, 0, 0], "b": [0, 1, 0]})
     result = from_dummies(dummies, default_category=default_category)
-    expected = DataFrame(expected)
+    expected = DataFrame(expected, dtype=dummies.columns.dtype)
     tm.assert_frame_equal(result, expected)
 
 
@@ -466,14 +465,16 @@ def test_object_dtype_preserved():
     # https://github.com/pandas-dev/pandas/pull/60694
     # When the input has object dtype, the result should as
     # well even when infer_string is True.
+    import pandas as pd
+
+    assert pd.get_option("future.infer_string")
     df = DataFrame(
         {
             "x": [1, 0, 0],
             "y": [0, 1, 0],
         },
     )
     df.columns = df.columns.astype("object")
-    with pd.option_context("future.infer_string", True):
-        result = from_dummies(df, default_category="z")
-        expected = DataFrame({"": ["x", "y", "z"]}, dtype="object")
-        tm.assert_frame_equal(result, expected)
+    result = from_dummies(df, default_category="z")
+    expected = DataFrame({"": ["x", "y", "z"]}, dtype="object")
+    tm.assert_frame_equal(result, expected)