1 | | -"""Tests that check whether the kernel density estimator behaves as expected.""" |
2 | | - |
3 | | -from itertools import product |
4 | | -from functools import partial |
5 | | -import math |
6 | | -import random |
7 | | -import unittest |
8 | | - |
9 | | -import torch |
10 | | -import numpy as np |
11 | | -from scipy.special import gamma |
12 | | -from torch.autograd import gradcheck |
13 | | - |
14 | | -from torchkde.kernels import * |
15 | | -from torchkde.modules import KernelDensity |
16 | | -from torchkde.bandwidths import SUPPORTED_BANDWIDTHS |
17 | | - |
18 | | -BANDWIDTHS = [1.0, 5.0] + SUPPORTED_BANDWIDTHS |
19 | | -DIMS = [1, 2] |
20 | | -TOLERANCE = 1e-1 |
21 | | -WEIGHTS = [False, True] |
22 | | - |
23 | | -DEVICES = ["cpu"] |
24 | | - |
25 | | -N1 = 100 |
26 | | -N2 = 10 |
27 | | -GRID_N = 1000 |
28 | | -GRID_RG = 100 |
29 | | - |
30 | | - |
31 | | -class TestKDE(unittest.TestCase): |
32 | | - def setUp(self): |
33 | | - torch.manual_seed(0) |
34 | | - random.seed(0) |
35 | | - np.random.seed(0) |
36 | | - torch.backends.cudnn.deterministic = True |
37 | | - torch.backends.cudnn.benchmark = False |
38 | | - |
39 | | - def test_integral(self): |
40 | | - """Test that the kernel density estimator integrates to 1.""" |
41 | | -        for kernel_str, bandwidth, dim, use_weights in product(SUPPORTED_KERNELS, BANDWIDTHS, DIMS, WEIGHTS): |
42 | | - if kernel_str == 'von-mises-fisher': |
43 | | - # Skip the von-mises-fisher kernel, must be handled differently |
44 | | - # as it is not defined in the same way as the other kernels |
45 | | - continue |
46 | | - X = sample_from_gaussian(dim, N1) |
47 | | - # Fit a kernel density estimator to the data |
48 | | - kde = KernelDensity(bandwidth=bandwidth, kernel=kernel_str) |
49 | | -            if use_weights: |
50 | | - weights = torch.rand((N1,)).exp() |
51 | | - _ = kde.fit(X, sample_weight=weights) |
52 | | - else: |
53 | | - _ = kde.fit(X) |
54 | | - # assess whether the kernel integrates to 1 |
55 | | -            # evaluate the kernel density estimator at a grid of d-dimensional points |
56 | | - # Create ranges for each dimension |
57 | | - ranges = [torch.linspace(-GRID_RG, GRID_RG, GRID_N) for _ in range(dim)] |
58 | | - # Create the d-dimensional meshgrid |
59 | | - meshgrid = torch.meshgrid(*ranges, indexing='ij') # 'ij' indexing for Cartesian coordinates |
60 | | - |
61 | | - # Convert meshgrid to a single tensor of shape (n_points, d) |
62 | | - grid_points = torch.stack(meshgrid, dim=-1).reshape(-1, dim) |
63 | | - probs = kde.score_samples(grid_points).exp() |
64 | | -            delta = (GRID_RG * 2) / (GRID_N - 1)  # actual spacing of torch.linspace over [-GRID_RG, GRID_RG] |
65 | | - integral = probs.sum() * (delta**dim) |
66 | | - self.assertTrue((integral - 1.0).abs() < TOLERANCE, |
67 | | -                            f"Kernel {kernel_str}, for dimensionality {dim} " |
68 | | -                            f"and bandwidth {bandwidth} does not integrate to 1.") |
69 | | - |
70 | | - def test_vmf_integral(self): # von-Mises-Fisher must be tested differently from other kernels |
71 | | -        for bandwidth, dim, use_weights in product(BANDWIDTHS, DIMS, WEIGHTS): |
72 | | -            if dim == 1 or isinstance(bandwidth, str): |
73 | | -                # skip dim 1 and the bandwidth selection heuristics: this test only |
74 | | -                # covers the von-Mises-Fisher kernel with numeric bandwidths |
75 | | -                continue |
76 | | - X = sample_from_gaussian(dim, N1) |
77 | | - X = X / X.norm(dim=1, keepdim=True) # project onto sphere |
78 | | - # Fit a kernel density estimator to the data |
79 | | - kde = KernelDensity(bandwidth=bandwidth, kernel='von-mises-fisher') |
80 | | -            if use_weights: |
81 | | - weights = torch.rand((N1,)).exp() |
82 | | - _ = kde.fit(X, sample_weight=weights) |
83 | | - else: |
84 | | - _ = kde.fit(X) |
85 | | - # assess whether the kernel integrates to 1 |
86 | | - |
87 | | -            # Sample uniformly from the unit sphere by normalizing Gaussian samples |
88 | | - mesh_samples = sample_from_gaussian(dim, GRID_N**dim) |
89 | | - mesh_samples = mesh_samples / mesh_samples.norm(dim=1, keepdim=True) # project onto sphere |
90 | | - |
91 | | - probs = kde.score_samples(mesh_samples).exp() |
92 | | - surface_area = 2 * math.pi ** (dim / 2) / gamma(dim / 2) |
93 | | - integral = probs.mean() * surface_area |
94 | | - self.assertTrue((integral - 1.0).abs() < TOLERANCE, |
95 | | -                            f"Kernel von-mises-fisher, for dimensionality {dim} " |
96 | | -                            f"and bandwidth {bandwidth} does not integrate to 1.") |
97 | | - |
98 | | - |
99 | | - def test_diffble(self, bandwidth=torch.tensor(1.0), eps=1e-07): |
100 | | - """Test that the kernel density estimator is differentiable.""" |
101 | | - for kernel_str, dim in product(SUPPORTED_KERNELS, DIMS): |
102 | | - def fit_and_eval(X, X_new, bandwidth): |
103 | | - kde = KernelDensity(bandwidth=bandwidth, kernel=kernel_str) |
104 | | - _ = kde.fit(X) |
105 | | - return kde.score_samples(X_new) |
106 | | -            X = sample_from_gaussian(dim, N1).to(torch.float64)  # convert to double, required for gradcheck |
107 | | - X_new = sample_from_gaussian(dim, N2).to(torch.float64) |
108 | | - |
109 | | - if kernel_str == "von-mises-fisher": # normalization required |
110 | | - if dim == 1: |
111 | | - continue |
112 | | - # Project the data onto the unit sphere |
113 | | - X = X / X.norm(dim=1, keepdim=True) |
114 | | - X_new = X_new / X_new.norm(dim=1, keepdim=True) |
115 | | - |
116 | | - bandwidth = bandwidth.to(torch.float64) |
117 | | - |
118 | | - X.requires_grad = True |
119 | | - X_new.requires_grad = False |
120 | | - bandwidth.requires_grad = False |
121 | | - |
122 | | - # Check that the kernel density estimator is differentiable w.r.t. the training data |
123 | | - fnc = partial(fit_and_eval, X_new=X_new, bandwidth=bandwidth) |
124 | | - self.assertTrue(gradcheck(lambda X_: fnc(X=X_), (X,), raise_exception=False, eps=eps), |
125 | | -                            f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. training data.") |
126 | | - |
127 | | -            if kernel_str != "von-mises-fisher":  # bandwidth gradients are not checked for the vMF kernel |
128 | | - X.requires_grad = False |
129 | | - X_new.requires_grad = False |
130 | | - bandwidth.requires_grad = True |
131 | | - |
132 | | - # Check that the kernel density estimator is differentiable w.r.t. the bandwidth |
133 | | - fnc = partial(fit_and_eval, X=X, X_new=X_new) |
134 | | - self.assertTrue(gradcheck(lambda bandwidth_: fnc(bandwidth=bandwidth_), (bandwidth,), raise_exception=False, eps=eps), |
135 | | -                                f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. the bandwidth.") |
136 | | - |
137 | | - X.requires_grad = False |
138 | | - X_new.requires_grad = True |
139 | | - bandwidth.requires_grad = False |
140 | | - |
141 | | - # Check that the kernel density estimator is differentiable w.r.t. the evaluation data |
142 | | - fnc = partial(fit_and_eval, X=X, bandwidth=bandwidth) |
143 | | - self.assertTrue(gradcheck(lambda X_new_: fnc(X_new=X_new_), (X_new,), raise_exception=False, eps=eps), |
144 | | -                            f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. evaluation data.") |
145 | | - |
146 | | - |
147 | | -def sample_from_gaussian(dim, N): |
148 | | - # sample data from a normal distribution |
149 | | - mean = torch.zeros(dim) |
150 | | - covariance_matrix = torch.eye(dim) |
151 | | - |
152 | | - # Create the multivariate Gaussian distribution |
153 | | - multivariate_normal = torch.distributions.MultivariateNormal(mean, covariance_matrix) |
154 | | - X = multivariate_normal.sample((N,)) |
155 | | - return X |
156 | | - |
157 | | - |
158 | | -if __name__ == "__main__": |
159 | | - torch.manual_seed(0) # ensure reproducibility |
160 | | - unittest.main() |
| 1 | +"""Tests that check whether the kernel density estimator behaves as expected.""" |
| 2 | + |
| 3 | +from itertools import product |
| 4 | +from functools import partial |
| 5 | +import math |
| 6 | +import random |
| 7 | +import unittest |
| 8 | + |
| 9 | +import torch |
| 10 | +from torch import distributions as dist |
| 11 | +import numpy as np |
| 12 | +from scipy.special import gamma |
| 13 | +from torch.autograd import gradcheck |
| 14 | + |
| 15 | +import torchkde |
| 16 | +from torchkde.kernels import * |
| 17 | +from torchkde.modules import KernelDensity |
| 18 | +from torchkde.bandwidths import SUPPORTED_BANDWIDTHS |
| 19 | + |
| 20 | +BANDWIDTHS = [1.0, 5.0] + SUPPORTED_BANDWIDTHS |
| 21 | +DIMS = [1, 2] |
| 22 | +TOLERANCE = 1e-1 |
| 23 | +WEIGHTS = [False, True] |
| 24 | + |
| 25 | +DEVICES = ["cpu"] |
| 26 | + |
| 27 | +N1 = 100 |
| 28 | +N2 = 10 |
| 29 | +GRID_N = 1000 |
| 30 | +GRID_RG = 100 |
| 31 | + |
| 32 | + |
| 33 | +class TestKDE(unittest.TestCase): |
| 34 | + def setUp(self): |
| 35 | + torch.manual_seed(0) |
| 36 | + random.seed(0) |
| 37 | + np.random.seed(0) |
| 38 | + torch.backends.cudnn.deterministic = True |
| 39 | + torch.backends.cudnn.benchmark = False |
| 40 | + |
| 41 | + def test_integral(self): |
| 42 | + """Test that the kernel density estimator integrates to 1.""" |
| 43 | +        for kernel_str, bandwidth, dim, use_weights in product(SUPPORTED_KERNELS, BANDWIDTHS, DIMS, WEIGHTS): |
| 44 | + if kernel_str == 'von-mises-fisher': |
| 45 | + # Skip the von-mises-fisher kernel, must be handled differently |
| 46 | + # as it is not defined in the same way as the other kernels |
| 47 | + continue |
| 48 | + X = sample_from_gaussian(dim, N1) |
| 49 | + # Fit a kernel density estimator to the data |
| 50 | + kde = KernelDensity(bandwidth=bandwidth, kernel=kernel_str) |
| 51 | +            if use_weights: |
| 52 | + weights = torch.rand((N1,)).exp() |
| 53 | + _ = kde.fit(X, sample_weight=weights) |
| 54 | + else: |
| 55 | + _ = kde.fit(X) |
| 56 | + # assess whether the kernel integrates to 1 |
| 57 | +            # evaluate the kernel density estimator at a grid of d-dimensional points |
| 58 | + # Create ranges for each dimension |
| 59 | + ranges = [torch.linspace(-GRID_RG, GRID_RG, GRID_N) for _ in range(dim)] |
| 60 | + # Create the d-dimensional meshgrid |
| 61 | + meshgrid = torch.meshgrid(*ranges, indexing='ij') # 'ij' indexing for Cartesian coordinates |
| 62 | + |
| 63 | + # Convert meshgrid to a single tensor of shape (n_points, d) |
| 64 | + grid_points = torch.stack(meshgrid, dim=-1).reshape(-1, dim) |
| 65 | + probs = kde.score_samples(grid_points).exp() |
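| | +            # Riemann sum: the densities summed over the grid, times the cell volume delta**dim, should be close to 1 |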
| 66 | +            delta = (GRID_RG * 2) / (GRID_N - 1)  # actual spacing of torch.linspace over [-GRID_RG, GRID_RG] |
| 67 | + integral = probs.sum() * (delta**dim) |
| 68 | + self.assertTrue((integral - 1.0).abs() < TOLERANCE, |
| 69 | +                            f"Kernel {kernel_str}, for dimensionality {dim} " |
| 70 | +                            f"and bandwidth {bandwidth} does not integrate to 1.") |
| 71 | + |
| 72 | + def test_vmf_integral(self): # von-Mises-Fisher must be tested differently from other kernels |
| 73 | +        for bandwidth, dim, use_weights in product(BANDWIDTHS, DIMS, WEIGHTS): |
| 74 | +            if dim == 1 or isinstance(bandwidth, str): |
| 75 | +                # skip dim 1 and the bandwidth selection heuristics: this test only |
| 76 | +                # covers the von-Mises-Fisher kernel with numeric bandwidths |
| 77 | +                continue |
| 78 | + X = sample_from_gaussian(dim, N1) |
| 79 | + X = X / X.norm(dim=1, keepdim=True) # project onto sphere |
| 80 | + # Fit a kernel density estimator to the data |
| 81 | + kde = KernelDensity(bandwidth=bandwidth, kernel='von-mises-fisher') |
| 82 | +            if use_weights: |
| 83 | + weights = torch.rand((N1,)).exp() |
| 84 | + _ = kde.fit(X, sample_weight=weights) |
| 85 | + else: |
| 86 | + _ = kde.fit(X) |
| 87 | + # assess whether the kernel integrates to 1 |
| 88 | + |
| 89 | +            # Sample uniformly from the unit sphere by normalizing Gaussian samples |
| 90 | + mesh_samples = sample_from_gaussian(dim, GRID_N**dim) |
| 91 | + mesh_samples = mesh_samples / mesh_samples.norm(dim=1, keepdim=True) # project onto sphere |
| 92 | + |
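| | +            # Monte Carlo integration: normalized Gaussian samples are uniform on the sphere, so the |
| | +            # mean density times the surface area of the unit (dim-1)-sphere should be close to 1 |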
| 93 | + probs = kde.score_samples(mesh_samples).exp() |
| 94 | + surface_area = 2 * math.pi ** (dim / 2) / gamma(dim / 2) |
| 95 | + integral = probs.mean() * surface_area |
| 96 | + self.assertTrue((integral - 1.0).abs() < TOLERANCE, |
| 97 | +                            f"Kernel von-mises-fisher, for dimensionality {dim} " |
| 98 | +                            f"and bandwidth {bandwidth} does not integrate to 1.") |
| 99 | + |
| 100 | + |
| 101 | + def test_diffble(self, bandwidth=torch.tensor(1.0), eps=1e-07): |
| 102 | + """Test that the kernel density estimator is differentiable.""" |
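| | +        # gradcheck compares autograd gradients against finite differences; it is only |
| | +        # reliable in double precision, with gradients enabled on one argument at a time |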
| 103 | + for kernel_str, dim in product(SUPPORTED_KERNELS, DIMS): |
| 104 | + def fit_and_eval(X, X_new, bandwidth): |
| 105 | + kde = KernelDensity(bandwidth=bandwidth, kernel=kernel_str) |
| 106 | + _ = kde.fit(X) |
| 107 | + return kde.score_samples(X_new) |
| 108 | +            X = sample_from_gaussian(dim, N1).to(torch.float64)  # convert to double, required for gradcheck |
| 109 | + X_new = sample_from_gaussian(dim, N2).to(torch.float64) |
| 110 | + |
| 111 | + if kernel_str == "von-mises-fisher": # normalization required |
| 112 | + if dim == 1: |
| 113 | + continue |
| 114 | + # Project the data onto the unit sphere |
| 115 | + X = X / X.norm(dim=1, keepdim=True) |
| 116 | + X_new = X_new / X_new.norm(dim=1, keepdim=True) |
| 117 | + |
| 118 | + bandwidth = bandwidth.to(torch.float64) |
| 119 | + |
| 120 | + X.requires_grad = True |
| 121 | + X_new.requires_grad = False |
| 122 | + bandwidth.requires_grad = False |
| 123 | + |
| 124 | + # Check that the kernel density estimator is differentiable w.r.t. the training data |
| 125 | + fnc = partial(fit_and_eval, X_new=X_new, bandwidth=bandwidth) |
| 126 | + self.assertTrue(gradcheck(lambda X_: fnc(X=X_), (X,), raise_exception=False, eps=eps), |
| 127 | +                            f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. training data.") |
| 128 | + |
| 129 | +            if kernel_str != "von-mises-fisher":  # bandwidth gradients are not checked for the vMF kernel |
| 130 | + X.requires_grad = False |
| 131 | + X_new.requires_grad = False |
| 132 | + bandwidth.requires_grad = True |
| 133 | + |
| 134 | + # Check that the kernel density estimator is differentiable w.r.t. the bandwidth |
| 135 | + fnc = partial(fit_and_eval, X=X, X_new=X_new) |
| 136 | + self.assertTrue(gradcheck(lambda bandwidth_: fnc(bandwidth=bandwidth_), (bandwidth,), raise_exception=False, eps=eps), |
| 137 | +                                f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. the bandwidth.") |
| 138 | + |
| 139 | + X.requires_grad = False |
| 140 | + X_new.requires_grad = True |
| 141 | + bandwidth.requires_grad = False |
| 142 | + |
| 143 | + # Check that the kernel density estimator is differentiable w.r.t. the evaluation data |
| 144 | + fnc = partial(fit_and_eval, X=X, bandwidth=bandwidth) |
| 145 | + self.assertTrue(gradcheck(lambda X_new_: fnc(X_new=X_new_), (X_new,), raise_exception=False, eps=eps), |
| 146 | +                            f"Kernel {kernel_str}, for dimensionality {dim} is not differentiable w.r.t. evaluation data.") |
| 147 | + |
| 148 | +    def test_sampling_adheres_to_weights(self): |
| 149 | +        # test that the sample_weight passed to fit(X, sample_weight=...) is respected when sampling |
| 150 | +        n_samples = 2000 |
| 151 | + |
| 152 | +        # create a GMM with 2 components weighted by pi |
| 153 | +        pi = torch.tensor([0.9, 0.05]) # 90 % for component 1, 5 % for component 2 (does not need to sum to 1) |
| 154 | + loc1 = torch.tensor([10.,10]) |
| 155 | + cov1 = torch.diag(torch.tensor([1.,1])) |
| 156 | + loc2 = torch.tensor([0.,0]) |
| 157 | + cov2 = torch.diag(torch.tensor([1.,1])) |
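| | +        # each training sample is weighted by its component's mixture weight, mirroring pi |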
| 158 | + weights1 = torch.ones((n_samples,))*pi[0] |
| 159 | + weights2 = torch.ones((n_samples,))*pi[1] |
| 160 | + |
| 161 | + locs = torch.stack([loc1, loc2]) # Shape: [n_components, event_shape] = [2, 2] |
| 162 | + covs = torch.stack([cov1, cov2]) # Shape: [n_components, event_shape, event_shape] = [2, 2, 2] |
| 163 | + |
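| | +        # 1. Create the component distributions (a batch of two MultivariateNormals) |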
| 164 | +        component_distribution = dist.MultivariateNormal( |
| 165 | + loc=locs, |
| 166 | + covariance_matrix=covs |
| 167 | + ) |
| 168 | + |
| 169 | + # 2. Create the mixing distribution (Categorical) |
| 170 | +        # pi is interpreted as unnormalized probabilities on the linear scale |
| 171 | + mixing_distribution = dist.Categorical(probs=pi) |
| 172 | + |
| 173 | + # 3. Create the MixtureSameFamily distribution |
| 174 | + # This combines the mixing and component distributions |
| 175 | + gmm = dist.MixtureSameFamily( |
| 176 | + mixture_distribution=mixing_distribution, |
| 177 | + component_distribution=component_distribution |
| 178 | + ) |
| 179 | + |
| 180 | + |
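| | +        # draw from both components: X has shape [n_samples, n_components, dim] |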
| 181 | + X = component_distribution.sample((n_samples,)) |
| 182 | + X1 = X[:,0,:] |
| 183 | + X2 = X[:,1,:] |
| 184 | + |
| 185 | +        kde = torchkde.KernelDensity(bandwidth=0.5, kernel='gaussian') # create kde object with isotropic bandwidth matrix |
| 186 | + kde.fit(torch.concat((X1, X2), dim=0), sample_weight=torch.concat((weights1, weights2), dim=0)) # fit kde to weighted data |
| 187 | + |
| 188 | + samples_from_kde = kde.sample(n_samples) |
| 189 | + samples_from_gmm = gmm.sample((n_samples,)) |
| 190 | + |
| 191 | +        # threshold at x = 5, the midpoint between the component means, to attribute samples |
| 192 | +        component_1_fraction_kde = (samples_from_kde[:, 0] > 5.).float().mean() |
| 193 | +        component_1_fraction_gmm = (samples_from_gmm[:, 0] > 5.).float().mean() |
| 194 | +        self.assertTrue(0.9 < (component_1_fraction_kde / component_1_fraction_gmm) < 1.1, "Component weights must be considered on sampling.") |
| 195 | + |
| 196 | + |
| 197 | +def sample_from_gaussian(dim, N): |
| 198 | + # sample data from a normal distribution |
| 199 | + mean = torch.zeros(dim) |
| 200 | + covariance_matrix = torch.eye(dim) |
| 201 | + |
| 202 | + # Create the multivariate Gaussian distribution |
| 203 | + multivariate_normal = torch.distributions.MultivariateNormal(mean, covariance_matrix) |
| 204 | + X = multivariate_normal.sample((N,)) |
| 205 | + return X |
| 206 | + |
| 207 | + |
| 208 | +if __name__ == "__main__": |
| 209 | + torch.manual_seed(0) # ensure reproducibility |
| 210 | + unittest.main() |