Skip to content

Commit 8bbf7d6

Browse files
authored
PCA Config Update and Imports Fix (#50)
1 parent 3a0d7b9 commit 8bbf7d6

File tree

15 files changed, with 39 additions (+39) and 17 deletions (-17).

configs/skl_config.json

Lines changed: 10 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -65,7 +65,6 @@
6565
"tol": [0.0]
6666
},
6767
{
68-
"lib": ["daal4py"],
6968
"algorithm": "pca",
7069
"dataset": [
7170
{
@@ -97,9 +96,18 @@
9796
"training": {
9897
"n_samples": 30000
9998
}
99+
},
100+
{
101+
"source": "synthetic",
102+
"type": "classification",
103+
"n_classes": 2,
104+
"n_features": 4000,
105+
"training": {
106+
"n_samples": 6000
107+
}
100108
}
101109
],
102-
"svd-solver": ["correlation"],
110+
"svd-solver": ["full"],
103111
"n-components": [10]
104112
},
105113
{

sklearn_bench/dbscan.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@
1919
import os
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
22-
from sklearn.cluster import DBSCAN
2322
from sklearn.metrics.cluster import davies_bouldin_score
2423

2524
parser = argparse.ArgumentParser(description='scikit-learn DBSCAN benchmark')
@@ -30,6 +29,8 @@
3029
'neighborhood to consider a point a core point')
3130
params = bench.parse_args(parser, n_jobs_supported=True)
3231

32+
from sklearn.cluster import DBSCAN
33+
3334
# Load generated data
3435
X, _, _, _ = bench.load_data(params, add_dtype=True)
3536

sklearn_bench/df_clsf.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,6 @@
2121
import bench
2222

2323
import numpy as np
24-
from sklearn.ensemble import RandomForestClassifier
2524
from sklearn.metrics import accuracy_score
2625

2726
parser = argparse.ArgumentParser(description='scikit-learn random forest '
@@ -47,6 +46,8 @@
4746

4847
params = bench.parse_args(parser)
4948

49+
from sklearn.ensemble import RandomForestClassifier
50+
5051
# Load and convert data
5152
X_train, X_test, y_train, y_test = bench.load_data(params)
5253

sklearn_bench/df_regr.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@
1919
import argparse
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
22-
from sklearn.ensemble import RandomForestRegressor
2322

2423
parser = argparse.ArgumentParser(description='scikit-learn random forest '
2524
'regression benchmark')
@@ -45,6 +44,8 @@
4544

4645
params = bench.parse_args(parser)
4746

47+
from sklearn.ensemble import RandomForestRegressor
48+
4849
# Load and convert data
4950
X_train, X_test, y_train, y_test = bench.load_data(params)
5051

sklearn_bench/distances.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@
1919
import argparse
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
22-
from sklearn.metrics.pairwise import pairwise_distances
2322

2423
parser = argparse.ArgumentParser(description='scikit-learn pairwise distances '
2524
'benchmark')
@@ -28,6 +27,8 @@
2827
help='Metric to test for pairwise distances')
2928
params = bench.parse_args(parser)
3029

30+
from sklearn.metrics.pairwise import pairwise_distances
31+
3132
# Load data
3233
X, _, _, _ = bench.load_data(params, generated_data=['X_train'], add_dtype=True)
3334

sklearn_bench/elasticnet.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -20,8 +20,6 @@
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
2222

23-
from sklearn.linear_model import ElasticNet
24-
2523
parser = argparse.ArgumentParser(description='scikit-learn elastic-net regression '
2624
'benchmark')
2725
parser.add_argument('--no-fit-intercept', dest='fit_intercept', default=False,
@@ -37,6 +35,8 @@
3735
help='Tolerance for solver.')
3836
params = bench.parse_args(parser)
3937

38+
from sklearn.linear_model import ElasticNet
39+
4040
# Load data
4141
X_train, X_test, y_train, y_test = bench.load_data(params)
4242

sklearn_bench/kmeans.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,6 @@
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
2222
import numpy as np
23-
from sklearn.cluster import KMeans
2423
from sklearn.metrics.cluster import davies_bouldin_score
2524

2625
parser = argparse.ArgumentParser(description='scikit-learn K-means benchmark')
@@ -33,6 +32,8 @@
3332
parser.add_argument('--n-clusters', type=int, help='Number of clusters')
3433
params = bench.parse_args(parser)
3534

35+
from sklearn.cluster import KMeans
36+
3637
# Load and convert generated data
3738
X_train, X_test, _, _ = bench.load_data(params)
3839

sklearn_bench/knn_clsf.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,6 @@
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
2222
import numpy as np
23-
from sklearn.neighbors import KNeighborsClassifier
2423
from sklearn.metrics import accuracy_score
2524

2625
parser = argparse.ArgumentParser(
@@ -40,6 +39,8 @@
4039
help='Distance metric to use')
4140
params = bench.parse_args(parser)
4241

42+
from sklearn.neighbors import KNeighborsClassifier
43+
4344
# Load generated data
4445
X_train, X_test, y_train, y_test = bench.load_data(params)
4546
params.n_classes = len(np.unique(y_train))

sklearn_bench/lasso.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@
1919
import os
2020
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2121
import bench
22-
from sklearn.linear_model import Lasso
2322

2423
parser = argparse.ArgumentParser(description='scikit-learn lasso regression '
2524
'benchmark')
@@ -34,6 +33,8 @@
3433
help='Tolerance for solver.')
3534
params = bench.parse_args(parser)
3635

36+
from sklearn.linear_model import Lasso
37+
3738
# Load data
3839
X_train, X_test, y_train, y_test = bench.load_data(params)
3940

sklearn_bench/linear.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,6 @@
2020
import os
2121
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
2222
import bench
23-
from sklearn.linear_model import LinearRegression
2423

2524
parser = argparse.ArgumentParser(description='scikit-learn linear regression '
2625
'benchmark')
@@ -29,6 +28,8 @@
2928
help="Don't fit intercept (assume data already centered)")
3029
params = bench.parse_args(parser)
3130

31+
from sklearn.linear_model import LinearRegression
32+
3233
# Load data
3334
X_train, X_test, y_train, y_test = bench.load_data(
3435
params, generated_data=['X_train', 'y_train'])

0 commit comments

Comments
 (0)