Performance improvements in TSNE algorithm (#1087)

Vika-F · napetrov · commit 5275ebac37c4 · 2022-12-15T13:53:45.000Z
diff --git a/.ci/pipeline/ci.yml b/.ci/pipeline/ci.yml
@@ -40,6 +40,9 @@ jobs:
   pool:
     vmImage: 'ubuntu-22.04'
   steps:
+  - script: |
+      bash .ci/scripts/describe_system.sh
+    displayName: 'System info'
   - task: UsePythonVersion@0
     inputs:
       versionSpec: '3.9'
diff --git a/daal4py/sklearn/manifold/_t_sne.py b/daal4py/sklearn/manifold/_t_sne.py
@@ -33,9 +33,11 @@
 from .._device_offload import support_usm_ndarray
 
 if sklearn_check_version('0.22'):
-    from sklearn.manifold._t_sne import _joint_probabilities, _joint_probabilities_nn
+    from sklearn.manifold._t_sne import _joint_probabilities
+    from sklearn.manifold._t_sne import _joint_probabilities_nn
 else:
-    from sklearn.manifold.t_sne import _joint_probabilities, _joint_probabilities_nn
+    from sklearn.manifold.t_sne import _joint_probabilities
+    from sklearn.manifold.t_sne import _joint_probabilities_nn
 
 
 class TSNE(BaseTSNE):
@@ -98,8 +100,19 @@ def _daal_tsne(self, P, n_samples, X_embedded):
         # * final optimization with momentum at 0.8
 
         # N, nnz, n_iter_without_progress, n_iter
-        size_iter = np.array([[n_samples], [P.nnz], [self.n_iter_without_progress],
-                             [self.n_iter]], dtype=P.dtype)
+        size_iter = [[n_samples], [P.nnz],
+                     [self.n_iter_without_progress],
+                     [self.n_iter]]
+
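+        # Append _EXPLORATION_N_ITER and _N_ITER_CHECK to size_iter only when
+        # daal_check_version((2023, 'P', 1)) passes; presumably older daal4py
+        # backends expect exactly the four rows above (TODO confirm).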
+        if daal_check_version((2023, 'P', 1)):
+            size_iter.extend(
+                [[self._EXPLORATION_N_ITER],
+                 [self._N_ITER_CHECK]]
+            )
+
+        size_iter = np.array(size_iter, dtype=P.dtype)
+
         params = np.array([[self.early_exaggeration], [self._learning_rate],
                           [self.min_grad_norm], [self.angle]], dtype=P.dtype)
         results = np.zeros((3, 1), dtype=P.dtype)  # curIter, error, gradNorm
@@ -164,17 +177,28 @@ def _fit(self, X, skip_num_points=0):
                                  "or 'auto'.")
 
         if hasattr(self, 'square_distances'):
-            if self.square_distances not in [True, 'legacy', 'deprecated']:
-                raise ValueError("'square_distances' must be True or 'legacy'.")
-            if self.metric != "euclidean" and self.square_distances is not True:
-                warnings.warn(("'square_distances' has been introduced in 0.24"
-                               "to help phase out legacy squaring behavior. The "
-                               "'legacy' setting will be removed in 0.26, and the "
-                               "default setting will be changed to True. In 0.28, "
-                               "'square_distances' will be removed altogether,"
-                               "and distances will be squared by default. Set "
-                               "'square_distances'=True to silence this warning."),
-                              FutureWarning)
+            if sklearn_check_version("1.1"):
+                if self.square_distances != "deprecated":
+                    warnings.warn(
+                        "The parameter `square_distances` has not effect "
+                        "and will be removed in version 1.3.",
+                        FutureWarning,
+                    )
+            else:
+                if self.square_distances not in [True, "legacy"]:
+                    raise ValueError(
+                        "'square_distances' must be True or 'legacy'.")
+                if self.metric != "euclidean" and self.square_distances is not True:
+                    warnings.warn(
+                        "'square_distances' has been introduced in 0.24 to help phase "
+                        "out legacy squaring behavior. The 'legacy' setting will be "
+                        "removed in 1.1 (renaming of 0.26), and the default setting "
+                        "will be changed to True. In 1.3, 'square_distances' will be "
+                        "removed altogether, and distances will be squared by "
+                        "default. Set 'square_distances'=True to silence this "
+                        "warning.",
+                        FutureWarning,
+                    )
 
         if self.method == 'barnes_hut':
             if sklearn_check_version('0.23'):
@@ -242,8 +266,12 @@ def _fit(self, X, skip_num_points=0):
                     distances = pairwise_distances(X, metric=self.metric,
                                                    squared=True)
                 else:
+                    metric_params_ = {}
+                    if sklearn_check_version('1.1'):
+                        metric_params_ = self.metric_params or {}
                     distances = pairwise_distances(X, metric=self.metric,
-                                                   n_jobs=self.n_jobs)
+                                                   n_jobs=self.n_jobs,
+                                                   **metric_params_)
 
             if np.any(distances < 0):
                 raise ValueError("All distances should be positive, the "
@@ -272,12 +300,22 @@ def _fit(self, X, skip_num_points=0):
                       .format(n_neighbors))
 
             # Find the nearest neighbors for every point
-            knn = NearestNeighbors(
-                algorithm='auto',
-                n_jobs=self.n_jobs,
-                n_neighbors=n_neighbors,
-                metric=self.metric,
-            )
+            knn = None
+            if sklearn_check_version("1.1"):
+                knn = NearestNeighbors(
+                    algorithm='auto',
+                    n_jobs=self.n_jobs,
+                    n_neighbors=n_neighbors,
+                    metric=self.metric,
+                    metric_params=self.metric_params
+                )
+            else:
+                knn = NearestNeighbors(
+                    algorithm='auto',
+                    n_jobs=self.n_jobs,
+                    n_neighbors=n_neighbors,
+                    metric=self.metric
+                )
             t0 = time()
             knn.fit(X)
             duration = time() - t0
@@ -336,11 +374,13 @@ def _fit(self, X, skip_num_points=0):
         # Laurens van der Maaten, 2009.
         degrees_of_freedom = max(self.n_components - 1, 1)
 
-        daal_ready = self.method == 'barnes_hut' and self.n_components == 2 and \
-            self.verbose == 0 and daal_check_version((2021, 'P', 600))
+        daal_ready = self.method == 'barnes_hut' and \
+            self.n_components == 2 and self.verbose == 0 and \
+            daal_check_version((2021, 'P', 600))
 
         if daal_ready:
-            X_embedded = check_array(X_embedded, dtype=[np.float32, np.float64])
+            X_embedded = check_array(
+                X_embedded, dtype=[np.float32, np.float64])
             return self._daal_tsne(
                 P,
                 n_samples,
diff --git a/requirements-dev.txt b/requirements-dev.txt
diff --git a/setup.py b/setup.py
diff --git a/src/daal4py.cpp b/src/daal4py.cpp
@@ -900,7 +900,7 @@ void c_generate_shuffled_indices(data_or_file & idx, data_or_file & random_state
 
 void c_tsne_gradient_descent(data_or_file & init, data_or_file & p, data_or_file & size_iter, data_or_file & params, data_or_file & results, char dtype)
 {
-#if __INTEL_DAAL__ == 2021 && INTEL_DAAL_VERSION >= 20210600
+#if __INTEL_DAAL__ >= 2021 && INTEL_DAAL_VERSION >= 20210600
     auto initTable                                     = get_table(init);
     auto pTable                                        = get_table(p);
     auto sizeIterTable                                 = get_table(size_iter);
diff --git a/src/daal4py.h b/src/daal4py.h
@@ -55,7 +55,7 @@ using daal::services::LibraryVersionInfo;
 #if __INTEL_DAAL__ == 2021 && INTEL_DAAL_VERSION >= 20210200
     #include "data_management/data/internal/roc_auc_score.h"
 #endif
-#if __INTEL_DAAL__ == 2021 && INTEL_DAAL_VERSION >= 20210600
+#if __INTEL_DAAL__ >= 2021 && INTEL_DAAL_VERSION >= 20210600
     #include "algorithms/tsne/tsne_gradient_descent.h"
 #endif
 

Original file line number	Diff line number	Diff line change
`@@ -900,7 +900,7 @@ void c_generate_shuffled_indices(data_or_file & idx, data_or_file & random_state`
`900`	`900`
`901`	`901`	`void c_tsne_gradient_descent(data_or_file & init, data_or_file & p, data_or_file & size_iter, data_or_file & params, data_or_file & results, char dtype)`
`902`	`902`	`{`
`903`		`-#if __INTEL_DAAL__ == 2021 && INTEL_DAAL_VERSION >= 20210600`
	`903`	`+#if __INTEL_DAAL__ >= 2021 && INTEL_DAAL_VERSION >= 20210600`
`904`	`904`	`auto initTable = get_table(init);`
`905`	`905`	`auto pTable = get_table(p);`
`906`	`906`	`auto sizeIterTable = get_table(size_iter);`