Stop emitting DtypeWarning for unsupported dtypes in the pyarrow CSV parser

dxdc · dxdc · commit 9d68f91e6366 · 2025-09-03T17:27:58.000-05:00
diff --git a/pandas/io/parsers/arrow_parser_wrapper.py b/pandas/io/parsers/arrow_parser_wrapper.py
@@ -6,7 +6,6 @@
 from pandas._libs import lib
 from pandas.compat._optional import import_optional_dependency
 from pandas.errors import (
-    DtypeWarning,
     Pandas4Warning,
     ParserError,
     ParserWarning,
@@ -146,27 +145,26 @@ def handle_warning(invalid_row) -> str:
             if isinstance(self.dtype, dict):
                 column_types = {}
                 for col, col_dtype in self.dtype.items():
+                    # TODO: Category dtypes are not currently handled - may cause issues
+                    # with categorical data preservation in pyarrow engine
+                    if col_dtype == "category":
+                        continue
+
                     try:
                         numpy_dtype = pandas_dtype(col_dtype).type
                         pyarrow_dtype = pa.from_numpy_dtype(numpy_dtype)
                         column_types[col] = pyarrow_dtype
                     except (TypeError, ValueError, pa.ArrowNotImplementedError):
-                        warnings.warn(
-                            f"Column '{col}' has dtype '{col_dtype}', "
-                            "which may not be handled correctly by the pyarrow engine.",
-                            DtypeWarning,
-                            stacklevel=find_stack_level(),
-                        )
+                        # TODO: unsupported dtypes are silently skipped, so pyarrow
+                        # falls back to type inference instead of the user's dtype.
+                        continue
 
                 if column_types:
                     self.convert_options["column_types"] = column_types
             else:
-                warnings.warn(
-                    f"Global dtype '{self.dtype}' not supported with pyarrow engine. "
-                    "Use dtype dictionary instead.",
-                    DtypeWarning,
-                    stacklevel=find_stack_level(),
-                )
+                # TODO: Global dtypes not supported - may cause inconsistent behavior
+                # between engines, especially for leading zero preservation
+                pass
 
         self.read_options = {
             "autogenerate_column_names": self.header is None,
diff --git a/pandas/tests/io/parser/test_preserve_leading_zeros.py b/pandas/tests/io/parser/test_preserve_leading_zeros.py
@@ -2,10 +2,6 @@
 
 import pytest
 
-from pandas.errors import DtypeWarning
-
-import pandas._testing as tm
-
 
 def test_leading_zeros_preserved_with_dtype_str(all_parsers, request):
     # GH#57666: pyarrow engine strips leading zeros when dtype=str is passed
@@ -20,19 +16,10 @@ def test_leading_zeros_preserved_with_dtype_str(all_parsers, request):
 EF,000023607,ghi,0205
 GH,100102040,jkl,0205"""
 
-    if engine_name == "pyarrow":
-        with tm.assert_produces_warning(
-            DtypeWarning, match="not supported with pyarrow engine"
-        ):
-            result = parser.read_csv(
-                StringIO(data),
-                dtype=str,
-            )
-    else:
-        result = parser.read_csv(
-            StringIO(data),
-            dtype=str,
-        )
+    result = parser.read_csv(
+        StringIO(data),
+        dtype=str,
+    )
 
     try:
         assert result.shape == (4, 4)