IntelPython
diff --git a/‎configs/common/sklearn.json‎
Lines changed: 5 additions & 0 deletions b/‎configs/common/sklearn.json‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎configs/incremental.json‎
Lines changed: 96 additions & 0 deletions b/‎configs/incremental.json‎
Lines changed: 96 additions & 0 deletions
diff --git a/‎configs/regular/batch_for_online.json‎
Lines changed: 84 additions & 0 deletions b/‎configs/regular/batch_for_online.json‎
Lines changed: 84 additions & 0 deletions
diff --git a/‎configs/regular/bf16/dbscan.json‎
Lines changed: 41 additions & 0 deletions b/‎configs/regular/bf16/dbscan.json‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎configs/regular/bf16/ensemble.json‎
Lines changed: 48 additions & 0 deletions b/‎configs/regular/bf16/ensemble.json‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎configs/regular/bf16/kmeans.json‎
Lines changed: 40 additions & 0 deletions b/‎configs/regular/bf16/kmeans.json‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎configs/regular/bf16/knn.json‎
Lines changed: 41 additions & 0 deletions b/‎configs/regular/bf16/knn.json‎
Lines changed: 41 additions & 0 deletions
@@ -12,6 +12,11 @@
                 { "library": "sklearnex", "device": ["cpu", "gpu"] }
             ]
         },
+        "sklearn-ex[gpu] implementations": {
+            "algorithm": [
+                {
+                    "library": "sklearnex",
+                    "device": ["gpu"]
+                }
+            ]
+        },
         "sklearn-ex[preview] implementations": {
             "algorithm": [
                 { "library": "sklearn", "device": "cpu" },
 
@@ -0,0 +1,96 @@
+{
+    "PARAMETERS_SETS": {
+        "common": {
+            "bench": {"n_runs": 10, "time_limit": 60}
+        },
+        "covariance data": {
+            "data": [
+                {
+                    "source": "make_blobs",
+                    "generation_kwargs": {"centers": 1, "n_samples": 1000, "n_features": [16, 64]},
+                    "split_kwargs": {"ignore": true}
+                }
+            ]
+        },
+        "basic_statistics data": {
+            "data": {
+                "source": "make_blobs",
+                "generation_kwargs": {"centers": 1, "n_samples": 10000, "n_features": [16, 64]},
+                "split_kwargs": {"ignore": true}
+            }
+        },
+        "linear_regression data": {
+            "data": {
+                "source": "make_regression",
+                "split_kwargs": {"train_size": 0.2, "test_size": 0.8},
+                "generation_kwargs": {"n_samples": 5000, "n_features": [40, 100], "n_informative": 5, "noise": 2.0}
+            }
+        },
+        "pca data": {
+            "data": {
+                "source": "make_blobs",
+                "generation_kwargs": {"centers": 1, "n_samples": 1000, "n_features": [16, 64]},
+                "split_kwargs": {"ignore": true}
+            }
+        },
+        "covariance": {
+            "algorithm": [{
+                "estimator": "IncrementalEmpiricalCovariance",
+                "library": "sklearnex.covariance",
+                "estimator_methods": { "training": "partial_fit" },
+                "num_batches": { "training": 2 }
+            }]
+        },
+        "basic_statistics": {
+            "algorithm": [
+                {
+                    "estimator": "IncrementalBasicStatistics",
+                    "library": "sklearnex.basic_statistics",
+                    "estimator_methods": {"training": "partial_fit"},
+                    "num_batches": {"training": 2}
+                }
+            ]
+        },
+        "linear_regression": {
+            "algorithm": [
+                {
+                    "estimator": "IncrementalLinearRegression",
+                    "library": "sklearnex.linear_model",
+                    "estimator_methods": {"training": "partial_fit"},
+                    "num_batches": {"training": 2}
+                }
+            ]
+        },
+        "pca": {
+            "algorithm": [
+                {
+                    "estimator": "IncrementalPCA",
+                    "library": "sklearnex.preview.decomposition",
+                    "estimator_methods": {"training": "partial_fit"},
+                    "num_batches": {"training": 2}
+                }
+            ]
+        }
+    },
+    "TEMPLATES": {
+        "basic_statistics": {
+            "SETS": ["common", "basic_statistics", "basic_statistics data"]
+        },
+        "covariance": {"SETS": ["common", "covariance", "covariance data"]},
+        "linear_regression": {
+            "SETS": ["common", "linear_regression", "linear_regression data"]
+        },
+        "pca": {"SETS": ["common", "pca", "pca data"]}
+    }
+}
@@ -0,0 +1,84 @@
+{
+    "INCLUDE": ["../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common": {
+            "bench": {"n_runs": 10}
+        },
+        "basic_statistics data": {
+            "data": {
+                "source": "make_blobs",
+                "generation_kwargs": {"centers": 1, "n_samples": 12000000, "n_features": [10, 100]},
+                "split_kwargs": {"ignore": true}
+            }
+        },
+        "linear_regression data": {
+            "data": {
+                "source": "make_regression",
+                "split_kwargs": {"train_size": 0.2, "test_size": 0.8},
+                "generation_kwargs": {"n_samples": 12000000, "n_features": [10, 100], "n_informative": 5, "noise": 2.0}
+            }
+        },
+        "pca data": {
+            "data": {
+                "source": "make_blobs",
+                "generation_kwargs": {"centers": 1, "n_samples": 12000000, "n_features": [10, 100]},
+                "split_kwargs": {"ignore": true}
+            }
+        },
+        "basic_statistics": {
+            "algorithm": [{
+                "estimator": "BasicStatistics",
+                "library": "sklearnex.basic_statistics",
+                "estimator_methods": { "training": "fit" }
+            }]
+        },
+        "covariance": {
+            "algorithm": [{
+                "estimator": "EmpiricalCovariance",
+                "library": "sklearnex.preview.covariance",
+                "estimator_methods": { "training": "fit" }
+            }]
+        },
+        "linear_regression": {
+            "algorithm": [{
+                "estimator": "LinearRegression",
+                "library": "sklearnex.linear_model",
+                "estimator_methods": { "training": "fit" }
+            }]
+        },
+        "pca": {
+            "algorithm": [{
+                "estimator": "PCA",
+                "library": "sklearnex.decomposition",
+                "estimator_methods": { "training": "fit" }
+            }]
+        }
+    },
+    "TEMPLATES": {
+        "basic_statistics": {
+            "SETS": [
+                "common",
+                "basic_statistics",
+                "basic_statistics data",
+                "sklearn-ex[gpu] implementations"
+            ]
+        },
+        "covariance": {
+            "SETS": [
+                "common",
+                "basic_statistics data",
+                "sklearn-ex[gpu] implementations",
+                "covariance"
+            ]
+        },
+        "linear_regression": {
+            "SETS": [
+                "common",
+                "linear_regression",
+                "linear_regression data",
+                "sklearn-ex[gpu] implementations"
+            ]
+        },
+        "pca": {
+            "SETS": [
+                "common",
+                "pca",
+                "pca data",
+                "sklearn-ex[gpu] implementations"
+            ]
+        }
+    }
+}
@@ -0,0 +1,41 @@
+{
+    "INCLUDE": ["../../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common dbscan parameters": {
+            "algorithm": {
+                "estimator": "DBSCAN",
+                "estimator_params": { "eps": "[SPECIAL_VALUE]distances_quantile:0.01", "min_samples": 5, "metric": "euclidean" }
+            },
+            "data": { "dtype": ["float32"] }
+        },
+        "sklearn dbscan parameters": {
+            "algorithm": {
+                "estimator_params": { "algorithm": "brute", "n_jobs": "[SPECIAL_VALUE]physical_cpus" }
+            }
+        },
+        "synthetic dataset": {
+            "data": [
+                {
+                    "source": "make_blobs",
+                    "generation_kwargs": { "n_samples": 100000, "n_features": 10, "centers": 10 },
+                    "algorithm": {
+                        "estimator_params": { "eps": 5, "min_samples": 5 }
+                    }
+                }
+            ]
+        }
+    },
+    "TEMPLATES": {
+        "sklearn dbscan": {
+            "SETS": [
+                "sklearn-ex[gpu] implementations", "common dbscan parameters",
+                "sklearn dbscan parameters", "synthetic dataset"
+            ]
+        }
+    }
+}
@@ -0,0 +1,48 @@
+{
+    "INCLUDE": ["../../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common ensemble params": {
+            "algorithm": {
+                "estimator_params": {
+                    "n_estimators": 200, "max_depth": 16, "max_samples": 1.0,
+                    "min_samples_split": 5, "min_samples_leaf": 2, "min_impurity_decrease": 0.0,
+                    "bootstrap": true, "random_state": 42
+                }
+            },
+            "data": { "dtype": ["float32"] }
+        },
+        "sklearn ensemble classifier params": {
+            "algorithm": {
+                "estimator": [
+                    "RandomForestClassifier",
+                    "ExtraTreesClassifier"
+                ],
+                "estimator_params": {
+                    "criterion": "gini", "max_features": "sqrt", "max_leaf_nodes": null,
+                    "n_jobs": "[SPECIAL_VALUE]physical_cpus"
+                }
+            }
+        },
+        "synthetic data": {
+            "data": [
+                {
+                    "source": "make_classification",
+                    "split_kwargs": { "train_size": 500000, "test_size": 1000 },
+                    "generation_kwargs": { "n_samples": 501000, "n_features": 10, "n_classes": 2 },
+                    "algorithm": {
+                        "estimator_params": { "n_estimators": 20, "max_depth": 4 }
+                    }
+                }
+            ]
+        }
+    },
+    "TEMPLATES": {
+        "sklearn ensemble classification": {
+            "SETS": [
+                "sklearn-ex[gpu] implementations", "common ensemble params",
+                "sklearn ensemble classifier params", "synthetic data"
+            ]
+        }
+    }
+}
@@ -0,0 +1,40 @@
+{
+    "INCLUDE": ["../../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common kmeans parameters": {
+            "algorithm": {
+                "estimator": "KMeans",
+                "estimator_params": { "n_clusters": "[SPECIAL_VALUE]auto", "n_init": 1, "max_iter": 30, "tol": 1e-3, "random_state": 42 },
+                "estimator_methods": {
+                    "inference": "predict"
+                }
+            },
+            "data": {
+                "dtype": ["float32"],
+                "preprocessing_kwargs": {
+                    "normalize": true
+                }
+            }
+        },
+        "sklearn kmeans parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "init": "k-means++",
+                    "algorithm": "lloyd"
+                }
+            }
+        },
+        "synthetic data": {
+            "data": [
+                {
+                    "source": "make_blobs",
+                    "generation_kwargs": { "n_samples": 1000000, "n_features": 100, "centers": 100 },
+                    "algorithm": {
+                        "estimator_params": { "n_clusters": 100, "max_iter": 100 }
+                    }
+                }
+            ]
+        }
+    },
+    "TEMPLATES": {
+        "sklearn kmeans": {
+            "SETS": [
+                "sklearn-ex[gpu] implementations", "common kmeans parameters",
+                "sklearn kmeans parameters", "synthetic data"
+            ]
+        }
+    }
+}
@@ -0,0 +1,41 @@
+{
+    "INCLUDE": ["../../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common knn parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "n_neighbors": [10, 100],
+                    "weights": "uniform"
+                }
+            },
+            "data": {
+                "dtype": ["float32"],
+                "preprocessing_kwargs": { "normalize": true }
+            }
+        },
+        "sklearn knn parameters": {
+            "algorithm": { "estimator_params": { "n_jobs": "[SPECIAL_VALUE]physical_cpus" } }
+        },
+        "brute knn classifier": {
+            "algorithm": {
+                "estimator": "KNeighborsClassifier",
+                "estimator_params": { "algorithm": "brute" }
+            }
+        },
+        "brute knn regressor": {
+            "algorithm": {
+                "estimator": "KNeighborsRegressor",
+                "estimator_params": { "algorithm": "brute" }
+            }
+        },
+        "synthetic classification data": {
+            "data": [
+                {
+                    "source": "make_classification",
+                    "split_kwargs": { "train_size": 50000, "test_size": 1000 },
+                    "generation_kwargs": { "n_samples": 51000, "n_features": 100, "n_classes": 2, "n_informative": "[SPECIAL_VALUE]0.5" }
+                }
+            ]
+        },
+        "synthetic regression data": {
+            "data": [
+                {
+                    "source": "make_regression",
+                    "split_kwargs": { "train_size": 50000, "test_size": 1000 },
+                    "generation_kwargs": { "n_samples": 51000, "n_features": 100, "noise": 1.5 }
+                }
+            ]
+        }
+    },
+    "TEMPLATES": {
+        "sklearn brute knn clsf": {
+            "SETS": [
+                "sklearn-ex[gpu] implementations",
+                "common knn parameters",
+                "sklearn knn parameters",
+                "brute knn classifier",
+                "synthetic classification data"
+            ]
+        },
+        "sklearn brute knn regr": {
+            "SETS": [
+                "sklearn-ex[gpu] implementations",
+                "common knn parameters",
+                "sklearn knn parameters",
+                "brute knn regressor",
+                "synthetic regression data"
+            ]
+        }
+    }
+}