make release-tag: Merge branch 'main' into stable

sarahmish · sarahmish · commit 996f2aebb9b7 · 2026-02-13T13:04:39.000-05:00
diff --git a/HISTORY.md b/HISTORY.md
@@ -1,5 +1,16 @@
 # History
 
+## v0.27.1 - 2026-02-13
+
+### Bugs Fixed
+
+* Fix `Meets Threshold?` column in QualityReport details showing numerical values instead of booleans - Issue [#843](https://github.com/sdv-dev/SDMetrics/issues/843) by @fealho
+
+### Maintenance
+
+* Update README and other meta information to point to the DataCebo forum - Issue [#845](https://github.com/sdv-dev/SDMetrics/issues/845) by @pvk-developer
+* Update license information in pyproject.toml to use new format - Issue [#814](https://github.com/sdv-dev/SDMetrics/issues/814) by @pvk-developer
+
 ## v0.27.0 - 2026-01-29
 
 ### New Features
diff --git a/README.md b/README.md
@@ -9,7 +9,7 @@
 [![Downloads](https://pepy.tech/badge/sdmetrics)](https://pepy.tech/project/sdmetrics)
 [![Tests](https://github.com/sdv-dev/SDMetrics/workflows/Run%20Tests/badge.svg)](https://github.com/sdv-dev/SDMetrics/actions?query=workflow%3A%22Run+Tests%22+branch%3Amain)
 [![Coverage Status](https://codecov.io/gh/sdv-dev/SDMetrics/branch/main/graph/badge.svg)](https://codecov.io/gh/sdv-dev/SDMetrics)
-[![Slack](https://img.shields.io/badge/Community-Slack-blue?style=plastic&logo=slack)](https://bit.ly/sdv-slack-invite)
+[![Forum](https://img.shields.io/badge/Forum-Join%20now!-36C5F0)](https://forum.datacebo.com)
 [![Tutorial](https://img.shields.io/badge/Demo-Get%20started-orange?style=plastic&logo=googlecolab)](https://bit.ly/sdmetrics-demo)
 [![DOI](https://zenodo.org/badge/DOI/10.5281/zenodo.14279167.svg)](https://doi.org/10.5281/zenodo.14279167)
 
diff --git a/latest_requirements.txt b/latest_requirements.txt
@@ -1,7 +1,7 @@
-copulas==0.14.0
+copulas==0.14.1
 numpy==2.3.5
 pandas==2.3.3
 plotly==6.5.2
 scikit-learn==1.8.0
 scipy==1.17.0
-tqdm==4.67.1
+tqdm==4.67.3
diff --git a/pyproject.toml b/pyproject.toml
@@ -5,7 +5,6 @@ authors = [{ name = "MIT Data To AI Lab", email = "dailabmit@gmail.com" }]
 classifiers = [
     'Development Status :: 2 - Pre-Alpha',
     'Intended Audience :: Developers',
-    'License :: OSI Approved :: MIT License',
     'Natural Language :: English',
     'Programming Language :: Python :: 3',
     'Programming Language :: Python :: 3.9',
@@ -17,7 +16,8 @@ classifiers = [
 ]
 keywords = ['sdmetrics', 'SDMetrics']
 dynamic = ['version']
-license = { text = 'MIT license' }
+license = 'MIT'
+license-files = ['LICENSE']
 requires-python = ">=3.9,<3.15"
 readme = 'README.md'
 dependencies = [
@@ -53,7 +53,7 @@ dependencies = [
 "Issue Tracker" = "https://github.com/sdv-dev/SDMetrics/issues"
 "Changes" = "https://github.com/sdv-dev/SDMetrics/blob/main/HISTORY.md"
 "Twitter" = "https://twitter.com/sdv_dev"
-"Chat" = "https://bit.ly/sdv-slack-invite"
+"Chat" = "https://forum.datacebo.com/"
 
 [project.entry-points]
 sdmetrics = { main = 'sdmetrics.cli.__main__:main' }
@@ -105,7 +105,6 @@ dev = [
 
 [tool.setuptools]
 include-package-data = true
-license-files = ['LICENSE']
 
 [tool.setuptools.packages.find]
 include = ['sdmetrics', 'sdmetrics.*']
@@ -149,7 +148,7 @@ convention = 'google'
 add-ignore = ['D107', 'D407', 'D417']
 
 [tool.bumpversion]
-current_version = "0.27.0"
+current_version = "0.27.1.dev1"
 parse = '(?P<major>\d+)\.(?P<minor>\d+)\.(?P<patch>\d+)(\.(?P<release>[a-z]+)(?P<candidate>\d+))?'
 serialize = [
     '{major}.{minor}.{patch}.{release}{candidate}',
diff --git a/sdmetrics/__init__.py b/sdmetrics/__init__.py
@@ -4,7 +4,7 @@
 
 __author__ = 'MIT Data To AI Lab'
 __email__ = 'dailabmit@gmail.com'
-__version__ = '0.27.0'
+__version__ = '0.27.1.dev1'
 
 import sys
 import warnings as python_warnings
diff --git a/sdmetrics/reports/single_table/_properties/column_pair_trends.py b/sdmetrics/reports/single_table/_properties/column_pair_trends.py
@@ -392,6 +392,7 @@ def _generate_details(
             'Meets Threshold?': meets_threshold,
             'Error': error_messages,
         })
+        result['Meets Threshold?'] = result['Meets Threshold?'].astype('boolean')
 
         if result['Error'].isna().all():
             result = result.drop('Error', axis=1)
diff --git a/static_code_analysis.txt b/static_code_analysis.txt
@@ -1,4 +1,4 @@
-Run started:2026-01-29 21:43:48.344046+00:00
+Run started:2026-02-13 15:55:31.917050+00:00
 
 Test results:
 >> Issue: [B101:assert_used] Use of assert detected. The enclosed code will be removed when compiling to optimised byte code.
@@ -117,7 +117,7 @@ Test results:
 --------------------------------------------------
 
 Code scanned:
-	Total lines of code: 12188
+	Total lines of code: 12189
 	Total lines skipped (#nosec): 0
 	Total potential issues skipped due to specifically being disabled (e.g., #nosec BXXX): 0
 
diff --git a/tests/integration/reports/multi_table/test_quality_report.py b/tests/integration/reports/multi_table/test_quality_report.py
@@ -142,7 +142,7 @@ def test_multi_table_quality_report():
         'Real Correlation': [np.nan],
         'Synthetic Correlation': [np.nan],
         'Real Association': [np.nan],
-        'Meets Threshold?': [True],
+        'Meets Threshold?': pd.Series([True], dtype='boolean'),
     })
     pd.testing.assert_frame_equal(details[1], expected_df_1)
 
@@ -176,7 +176,7 @@ def test_multi_table_quality_report():
         'Real Correlation': [np.nan, np.nan, np.nan, np.nan, np.nan, np.nan],
         'Synthetic Correlation': [np.nan, np.nan, np.nan, np.nan, np.nan, np.nan],
         'Real Association': [np.nan, np.nan, np.nan, np.nan, np.nan, np.nan],
-        'Meets Threshold?': [True, True, True, True, True, True],
+        'Meets Threshold?': pd.Series([True, True, True, True, True, True], dtype='boolean'),
     })
     pd.testing.assert_frame_equal(details[3], expected_df_3)
     pd.testing.assert_frame_equal(details[7], expected_df_3)
@@ -205,7 +205,7 @@ def test_multi_table_quality_report():
         'Real Correlation': [np.nan, 0.946664, 0.966247, 0.862622],
         'Synthetic Correlation': [np.nan, 0.926925, 0.936853, 0.798384],
         'Real Association': [np.nan, np.nan, np.nan, np.nan],
-        'Meets Threshold?': [True, True, True, True],
+        'Meets Threshold?': pd.Series([True, True, True, True], dtype='boolean'),
     })
     pd.testing.assert_frame_equal(details[5], expected_df_4)
 
diff --git a/tests/integration/reports/single_table/_properties/test_column_pair_trends.py b/tests/integration/reports/single_table/_properties/test_column_pair_trends.py
@@ -61,7 +61,7 @@ def test_get_score(self):
             'Real Correlation': [0.04735340044317632, np.nan, np.nan, np.nan, np.nan, np.nan],
             'Synthetic Correlation': [-0.11506297326956302, np.nan, np.nan, np.nan, np.nan, np.nan],
             'Real Association': [np.nan] * 6,
-            'Meets Threshold?': [True] * 6,
+            'Meets Threshold?': pd.Series([True] * 6, dtype='boolean'),
         }
         expected_details = pd.DataFrame(expected_details_dict)
         pd.testing.assert_frame_equal(column_pair_trends.details, expected_details)
@@ -151,7 +151,7 @@ def test_only_categorical_columns(self):
             'Real Correlation': [np.nan] * 6,
             'Synthetic Correlation': [np.nan] * 6,
             'Real Association': [np.nan] * 6,
-            'Meets Threshold?': [True] * 6,
+            'Meets Threshold?': pd.Series([True] * 6, dtype='boolean'),
         }
         expected_details = pd.DataFrame(expected_details_dict)
         pd.testing.assert_frame_equal(column_pair_trends.details, expected_details)
@@ -187,7 +187,7 @@ def test_real_association_threshold_filters_pairs(self):
             'Real Correlation': [np.nan, np.nan, np.nan],
             'Synthetic Correlation': [np.nan, np.nan, np.nan],
             'Real Association': [0.0, 1.0, 0.0],
-            'Meets Threshold?': [False, True, False],
+            'Meets Threshold?': pd.Series([False, True, False], dtype='boolean'),
         })
         pd.testing.assert_frame_equal(column_pair_trends.details, expected_details)
         assert score == 1.0
diff --git a/tests/integration/reports/single_table/test_quality_report.py b/tests/integration/reports/single_table/test_quality_report.py
@@ -146,7 +146,7 @@ def test_report_end_to_end(self):
                 np.nan,
             ],
             'Real Association': [np.nan] * 6,
-            'Meets Threshold?': [True] * 6,
+            'Meets Threshold?': pd.Series([True] * 6, dtype='boolean'),
         }
         expected_details_column_shapes = pd.DataFrame(expected_details_column_shapes_dict)
         expected_details_cpt = pd.DataFrame(expected_details_cpt__dict)
@@ -314,7 +314,7 @@ def test_quality_report_with_object_datetimes(self):
                 np.nan,
             ],
             'Real Association': [np.nan] * 6,
-            'Meets Threshold?': [True] * 6,
+            'Meets Threshold?': pd.Series([True] * 6, dtype='boolean'),
         }
         expected_details_column_shapes = pd.DataFrame(expected_details_column_shapes_dict)
         expected_details_cpt = pd.DataFrame(expected_details_cpt__dict)
@@ -394,7 +394,9 @@ def test_report_end_to_end_with_errors(self):
             'Real Correlation': [np.nan] * 6,
             'Synthetic Correlation': [np.nan] * 6,
             'Real Association': [np.nan] * 6,
-            'Meets Threshold?': [np.nan, True, True, np.nan, np.nan, True],
+            'Meets Threshold?': pd.Series(
+                [np.nan, True, True, np.nan, np.nan, True], dtype='boolean'
+            ),
             'Error': [
                 'AttributeError',  # This can be either ValueError or AttributeError
                 None,
@@ -417,6 +419,27 @@ def test_report_end_to_end_with_errors(self):
         pd.testing.assert_frame_equal(col_pair_report[1:], expected_details_cpt[1:])
         assert report.get_score() == 0.8204378797402054
 
+    def test_meets_threshold_column_has_boolean_dtype_with_errors(self):
+        """Test that 'Meets Threshold?' column contains booleans when errors occur."""
+        # Setup
+        real_data, synthetic_data, metadata = load_demo(modality='single_table')
+        real_data.loc[2, 'second_perc'] = 'a'  # Corrupt data to trigger errors
+
+        # Run
+        report = QualityReport()
+        report.generate(real_data, synthetic_data, metadata, verbose=False)
+        details = report.get_details('Column Pair Trends')
+
+        # Assert
+        meets_threshold_col = details['Meets Threshold?']
+        assert meets_threshold_col.dtype == 'boolean'
+
+        # Ensure non-NA values are actual booleans, not integers
+        non_na_values = meets_threshold_col.dropna()
+        assert len(non_na_values) > 0
+        for val in non_na_values:
+            assert isinstance(val, np.bool_)
+
     def test_report_with_column_nan(self):
         """Test the report with column full of NaNs."""
         # Setup
@@ -538,7 +561,9 @@ def test_report_with_column_nan(self):
                 np.nan,
             ],
             'Real Association': [np.nan] * 10,
-            'Meets Threshold?': [True, True, True, np.nan, True, True, np.nan, True, True, True],
+            'Meets Threshold?': pd.array(
+                [True, True, True, pd.NA, True, True, pd.NA, True, True, True], dtype='boolean'
+            ),
             'Error': [
                 None,
                 None,
diff --git a/tests/unit/reports/single_table/_properties/test_column_pair_trends.py b/tests/unit/reports/single_table/_properties/test_column_pair_trends.py
@@ -496,7 +496,7 @@ def test__generate_details_real_correlation_threshold(self, correlation_compute_
             'Real Correlation': [0.2],
             'Synthetic Correlation': [0.1],
             'Real Association': [np.nan],
-            'Meets Threshold?': [False],
+            'Meets Threshold?': pd.Series([False], dtype='boolean'),
         })
         pd.testing.assert_frame_equal(details, expected_details)
         correlation_compute_mock.assert_called_once()
@@ -531,7 +531,7 @@ def test__generate_details_real_association_threshold(self, contingency_compute_
             'Real Correlation': [np.nan],
             'Synthetic Correlation': [np.nan],
             'Real Association': [0.2],
-            'Meets Threshold?': [False],
+            'Meets Threshold?': pd.Series([False], dtype='boolean'),
         })
         pd.testing.assert_frame_equal(details, expected_details)
         _, contingency_kwargs = contingency_compute_mock.call_args
@@ -641,7 +641,7 @@ def test_get_visualization_layout_alignment(self):
             'Real Correlation': [0.5],
             'Synthetic Correlation': [0.6],
             'Real Association': [0.2],
-            'Meets Threshold?': [True],
+            'Meets Threshold?': pd.Series([True], dtype='boolean'),
         })
 
         # Run