@@ -133,6 +133,7 @@ def kl_divergence_1D(df1: pd.Series, df2: pd.Series) -> np.number:
133133 q = np .histogram (df2 , bins = bins , density = True )[0 ]
134134 return scipy .stats .entropy (p + EPS , q + EPS )
135135
136+
136137def kl_divergence_columnwise (
137138 df1 : pd .DataFrame , df2 : pd .DataFrame , df_mask : pd .DataFrame
138139) -> pd .Series :
@@ -230,7 +231,8 @@ def kolmogorov_smirnov_test(df1: pd.DataFrame, df2: pd.DataFrame) -> pd.Series:
230231
231232
232233def total_variance_distance (df1 : pd .DataFrame , df2 : pd .DataFrame ) -> pd .Series :
233- """Total variance distance for categorical features, based on TVComplement in https://github.com/sdv-dev/SDMetrics
234+ """Total variance distance for categorical features.
235+ It is based on TVComplement in https://github.com/sdv-dev/SDMetrics
234236
235237 Parameters
236238 ----------
@@ -436,7 +438,8 @@ def _sum_distance_col(col: pd.Series, col_size: int) -> pd.Series:
436438
437439
438440def _sum_manhattan_distances (df1 : pd .DataFrame ) -> float :
439- """Sum Manhattan distances. It is based on https://www.geeksforgeeks.org/sum-manhattan-distances-pairs-points/
441+ """Sum Manhattan distances.
442+ It is based on https://www.geeksforgeeks.org/sum-manhattan-distances-pairs-points/
440443
441444 Parameters
442445 ----------
@@ -451,7 +454,8 @@ def _sum_manhattan_distances(df1: pd.DataFrame) -> float:
451454
452455
453456def sum_energy_distances (df1 : pd .DataFrame , df2 : pd .DataFrame ) -> float :
454- """Sum of energy distances between df1 and df2. It is based on https://dcor.readthedocs.io/en/latest/theory.html#
457+ """Sum of energy distances between df1 and df2.
458+ It is based on https://dcor.readthedocs.io/en/latest/theory.html#
455459
456460 Parameters
457461 ----------
@@ -508,6 +512,7 @@ def sum_pairwise_distances(df1: pd.DataFrame, df2: pd.DataFrame, metric: str = "
508512# Dataframe-wise metrics #
509513###########################
510514
515+
511516def frechet_distance (
512517 df1 : pd .DataFrame ,
513518 df2 : pd .DataFrame ,
@@ -568,4 +573,4 @@ def frechet_distance(
568573 if normalized :
569574 return pd .Series ((frechet_dist / df_true .shape [0 ]), index = ["All" ])
570575 else :
571- return pd .Series (np .repeat (frechet_dist , len (df1 .columns )))
576+ return pd .Series (np .repeat (frechet_dist , len (df1 .columns )))
0 commit comments