Remove excess comments. Revert the error type change to avoid API changes. Move nan_rep tests into a separate function.

JakeTT404 · JakeTT404 · commit 4627462965e8 · 2025-02-03T23:57:42.000Z
diff --git a/pandas/io/pytables.py b/pandas/io/pytables.py
@@ -3524,14 +3524,12 @@ def validate(self, other) -> None:
                     # Value of type "Optional[Any]" is not indexable  [index]
                     oax = ov[i]  # type: ignore[index]
                     if sax != oax:
-                        ## Raise clearer error if mismatching type on values_axes
                         if c == "values_axes" and sax.kind != oax.kind:
-                            raise TypeError(
+                            raise ValueError(
                                 f"Cannot serialize the column [{oax.values[0]}] "
                                 f"because its data contents are not [{sax.kind}] "
                                 f"but [{oax.kind}] object dtype"
                             )
-                        # Fallback if other source of difference
                         raise ValueError(
                             f"invalid combination of [{c}] on appending data "
                             f"[{sax}] vs current table [{oax}]"
diff --git a/pandas/tests/io/pytables/test_append.py b/pandas/tests/io/pytables/test_append.py
@@ -421,14 +421,6 @@ def check_col(key, name, size):
         with pytest.raises(ValueError, match=msg):
             store.append("df_new", df_new)
 
-        # bigger NaN representation on next append
-        df_new = DataFrame([[124, "a"], [346, "b"]])
-        store.append("df_new2", df_new)
-        df_new = DataFrame([[124, None], [346, "b"]])
-        msg = "NaN representation is too large for existing column size"
-        with pytest.raises(ValueError, match=msg):
-            store.append("df_new2", df_new)
-
         # min_itemsize on Series index (GH 11412)
         df = DataFrame(
             {
@@ -835,7 +827,7 @@ def test_append_raise(setup_path):
             "because its data contents are not [string] "
             "but [datetime64[s]] object dtype"
         )
-        with pytest.raises(TypeError, match=msg):
+        with pytest.raises(ValueError, match=msg):
             store.append("df", df)
 
 
@@ -1002,3 +994,29 @@ def test_append_to_multiple_min_itemsize(setup_path):
         )
         result = store.select_as_multiple(["index", "nums", "strs"])
         tm.assert_frame_equal(result, expected, check_index_type=True)
+
+
+def test_append_string_nan_rep(setup_path):
+    # GH 16300
+    df = DataFrame({"A": "a", "B": "foo"}, index=np.arange(10))
+    df_nan = df.copy()
+    df_nan.loc[0:4, :] = np.nan
+    msg = "NaN representation is too large for existing column size"
+
+    with ensure_clean_store(setup_path) as store:
+        # string column too small
+        store.append("sa", df["A"])
+        with pytest.raises(ValueError, match=msg):
+            store.append("sa", df_nan["A"])
+
+        # nan_rep too big
+        store.append("sb", df["B"], nan_rep="bars")
+        with pytest.raises(ValueError, match=msg):
+            store.append("sb", df_nan["B"])
+
+        # smaller modified nan_rep
+        store.append("sc", df["A"], nan_rep="n")
+        store.append("sc", df_nan["A"])
+        result = store["sc"]
+        expected = concat([df["A"], df_nan["A"]])
+        tm.assert_series_equal(result, expected)
diff --git a/pandas/tests/io/pytables/test_round_trip.py b/pandas/tests/io/pytables/test_round_trip.py
@@ -217,7 +217,7 @@ def test_table_values_dtypes_roundtrip(setup_path):
             "because its data contents are not [float] "
             "but [integer] object dtype"
         )
-        with pytest.raises(TypeError, match=msg):
+        with pytest.raises(ValueError, match=msg):
             store.append("df_i8", df1)
 
         # check creation/storage/retrieval of float32 (a bit hacky to

Original file line number	Diff line number	Diff line change
`@@ -217,7 +217,7 @@ def test_table_values_dtypes_roundtrip(setup_path):`
`217`	`217`	`"because its data contents are not [float] "`
`218`	`218`	`"but [integer] object dtype"`
`219`	`219`	`)`
`220`		`- with pytest.raises(TypeError, match=msg):`
	`220`	`+ with pytest.raises(ValueError, match=msg):`
`221`	`221`	`store.append("df_i8", df1)`
`222`	`222`
`223`	`223`	`# check creation/storage/retrieval of float32 (a bit hacky to`