@@ -4,17 +4,17 @@ REGRESSION_SIZE = 1000000x50
4
4
KMEANS_SAMPLES = 1000000
5
5
KMEANS_FEATURES = 50
6
6
KMEANS_SIZE = $(KMEANS_SAMPLES ) x$(KMEANS_FEATURES )
7
- SVM_SAMPLES = 50000
7
+ SVM_SAMPLES = 100000
8
8
SVM_FEATURES = 100
9
9
SVM_SIZE = $(SVM_SAMPLES ) x$(SVM_FEATURES )
10
10
LOGREG_SAMPLES = 100000
11
11
LOGREG_FEATURES = 100
12
12
LOGREG_SIZE = $(LOGREG_SAMPLES ) x$(LOGREG_FEATURES )
13
13
DFCLF_SAMPLES = 10000
14
- DFCLF_FEATURES = 50
14
+ DFCLF_FEATURES = 100
15
15
DFCLF_SIZE = $(DFCLF_SAMPLES ) x$(DFCLF_FEATURES )
16
16
DFREG_SAMPLES = 10000
17
- DFREG_FEATURES = 50
17
+ DFREG_FEATURES = 100
18
18
DFREG_SIZE = $(DFREG_SAMPLES ) x$(DFREG_FEATURES )
19
19
20
20
ITERATIONS = 10
@@ -29,20 +29,24 @@ SHELL = bash -o pipefail
29
29
30
30
# Other options
31
31
NUM_THREADS = -1
32
+ SVM_NUM_THREADS = 0
33
+ LOGREG_NUM_THREADS = $(SVM_NUM_THREADS )
34
+ DFCLF_NUM_THREADS = $(SVM_NUM_THREADS )
35
+ DFREG_NUM_THREADS = $(SVM_NUM_THREADS )
32
36
MULTIPLIER = 100
33
37
DATA_DIR = data/
34
38
DATA_kmeans = data/kmeans_$(KMEANS_SIZE ) .npy
35
39
36
- COMMON_ARGS = --batch '$(BATCH ) ' --arch '$(HOST ) ' \
37
- --num-threads '$(NUM_THREADS ) ' --header
40
+ COMMON_ARGS = --batch '$(BATCH ) ' --arch '$(HOST ) ' \
41
+ --num-threads '$(NUM_THREADS ) ' --header
38
42
39
43
# Define which benchmarks to run
40
- NATIVE_BENCHMARKS = distances ridge linear kmeans svm2 svm5 \
41
- logreg2 logreg5 dfclf2 dfclf5 dfreg pca_daal pca_full
44
+ NATIVE_BENCHMARKS = distances ridge linear kmeans svm2 svm5 \
45
+ logreg2 logreg5 dfclf2 dfclf5 dfreg pca_daal pca_full
42
46
SKLEARN_BENCHMARKS = distances ridge linear kmeans svm2 svm5 \
43
- logreg2 logreg5 dfclf2 dfclf5 dfreg pca_full
47
+ logreg2 logreg5 dfclf2 dfclf5 dfreg pca_full
44
48
DAAL4PY_BENCHMARKS = distances ridge linear kmeans svm2 svm5 \
45
- logreg2 logreg5 dfclf2 dfclf5 dfreg pca_daal pca_full
49
+ logreg2 logreg5 dfclf2 dfclf5 dfreg pca_daal pca_full
46
50
47
51
# Define native benchmark binary names
48
52
NATIVE_distances = distances
@@ -61,41 +65,41 @@ NATIVE_pca_full = pca
61
65
62
66
# Define arguments for native benchmarks
63
67
ARGS_NATIVE_distances = --num-threads "$(NUM_THREADS ) " \
64
- --size "$(DISTANCES_SIZE ) " --header
68
+ --size "$(DISTANCES_SIZE ) " --header
65
69
ARGS_NATIVE_ridge = --num-threads "$(NUM_THREADS ) " \
66
- --size "$(REGRESSION_SIZE ) " --header
70
+ --size "$(REGRESSION_SIZE ) " --header
67
71
ARGS_NATIVE_linear = --num-threads "$(NUM_THREADS ) " \
68
- --size "$(REGRESSION_SIZE ) " --header
72
+ --size "$(REGRESSION_SIZE ) " --header
69
73
ARGS_NATIVE_pca_daal = --num-threads "$(NUM_THREADS ) " --header \
70
- --size "$(REGRESSION_SIZE ) " --svd-solver daal
74
+ --size "$(REGRESSION_SIZE ) " --svd-solver daal
71
75
ARGS_NATIVE_pca_full = --num-threads "$(NUM_THREADS ) " --header \
72
- --size "$(REGRESSION_SIZE ) " --svd-solver full
76
+ --size "$(REGRESSION_SIZE ) " --svd-solver full
73
77
ARGS_NATIVE_kmeans = --num-threads "$(NUM_THREADS ) " --header \
74
- --data-multiplier "$(MULTIPLIER ) " \
75
- --filex data/kmeans_$(KMEANS_SIZE ) .npy \
76
- --filei data/kmeans_$(KMEANS_SIZE ) .init.npy \
77
- --filet data/kmeans_$(KMEANS_SIZE ) .tol.npy
78
- ARGS_NATIVE_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
79
- --fileY data/two/y-$(SVM_SIZE ) .npy \
80
- --num-threads $(SVM_NUM_THREADS ) --header
81
- ARGS_NATIVE_svm5 = --fileX data/multi/X-$(SVM_SIZE ) .npy \
82
- --fileY data/multi/y-$(SVM_SIZE ) .npy \
83
- --num-threads $(SVM_NUM_THREADS ) --header
78
+ --data-multiplier "$(MULTIPLIER ) " \
79
+ --filex data/kmeans_$(KMEANS_SIZE ) .npy \
80
+ --filei data/kmeans_$(KMEANS_SIZE ) .init.npy \
81
+ --filet data/kmeans_$(KMEANS_SIZE ) .tol.npy
82
+ ARGS_NATIVE_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
83
+ --fileY data/two/y-$(SVM_SIZE ) .npy \
84
+ --num-threads $(SVM_NUM_THREADS ) --header
85
+ ARGS_NATIVE_svm5 = --fileX data/multi/X-$(SVM_SIZE ) .npy \
86
+ --fileY data/multi/y-$(SVM_SIZE ) .npy \
87
+ --num-threads $(SVM_NUM_THREADS ) --header
84
88
ARGS_NATIVE_logreg2 = --fileX data/two/X-$(LOGREG_SIZE ) .npy \
85
- --fileY data/two/y-$(LOGREG_SIZE ) .npy \
86
- --num-threads $(LOGREG_NUM_THREADS ) --header
89
+ --fileY data/two/y-$(LOGREG_SIZE ) .npy \
90
+ --num-threads $(LOGREG_NUM_THREADS ) --header
87
91
ARGS_NATIVE_logreg5 = --fileX data/multi/X-$(LOGREG_SIZE ) .npy \
88
- --fileY data/multi/y-$(LOGREG_SIZE ) .npy \
89
- --num-threads $(LOGREG_NUM_THREADS ) --header
92
+ --fileY data/multi/y-$(LOGREG_SIZE ) .npy \
93
+ --num-threads $(LOGREG_NUM_THREADS ) --header
90
94
ARGS_NATIVE_dfclf2 = --fileX data/two/X-$(DFCLF_SIZE ) .npy \
91
- --fileY data/two/y-$(DFCLF_SIZE ) .npy \
92
- --num-threads $(DFCLF_NUM_THREADS ) --header
95
+ --fileY data/two/y-$(DFCLF_SIZE ) .npy \
96
+ --num-threads $(DFCLF_NUM_THREADS ) --header
93
97
ARGS_NATIVE_dfclf5 = --fileX data/multi/X-$(DFCLF_SIZE ) .npy \
94
- --fileY data/multi/y-$(DFCLF_SIZE ) .npy \
95
- --num-threads $(DFCLF_NUM_THREADS ) --header
98
+ --fileY data/multi/y-$(DFCLF_SIZE ) .npy \
99
+ --num-threads $(DFCLF_NUM_THREADS ) --header
96
100
ARGS_NATIVE_dfreg = --fileX data/reg/X-$(DFREG_SIZE ) .npy \
97
- --fileY data/reg/y-$(DFREG_SIZE ) .npy \
98
- --num-threads $(DFREG_NUM_THREADS ) --header
101
+ --fileY data/reg/y-$(DFREG_SIZE ) .npy \
102
+ --num-threads $(DFREG_NUM_THREADS ) --header
99
103
100
104
SKLEARN_distances = distances
101
105
SKLEARN_ridge = ridge
@@ -117,22 +121,22 @@ ARGS_SKLEARN_linear = --size "$(REGRESSION_SIZE)"
117
121
ARGS_SKLEARN_pca_daal = --size "$(REGRESSION_SIZE ) " --svd-solver daal
118
122
ARGS_SKLEARN_pca_full = --size "$(REGRESSION_SIZE ) " --svd-solver full
119
123
ARGS_SKLEARN_kmeans = --data-multiplier "$(MULTIPLIER ) " \
120
- --filex data/kmeans_$(KMEANS_SIZE ) .npy \
121
- --filei data/kmeans_$(KMEANS_SIZE ) .init.npy
122
- ARGS_SKLEARN_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
123
- --fileY data/two/y-$(SVM_SIZE ) .npy
124
+ --filex data/kmeans_$(KMEANS_SIZE ) .npy \
125
+ --filei data/kmeans_$(KMEANS_SIZE ) .init.npy
126
+ ARGS_SKLEARN_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
127
+ --fileY data/two/y-$(SVM_SIZE ) .npy
124
128
ARGS_SKLEARN_svm5 = --fileX data/multi/X-$(SVM_SIZE ) .npy \
125
- --fileY data/multi/y-$(SVM_SIZE ) .npy
129
+ --fileY data/multi/y-$(SVM_SIZE ) .npy
126
130
ARGS_SKLEARN_logreg2 = --fileX data/two/X-$(LOGREG_SIZE ) .npy \
127
- --fileY data/two/y-$(LOGREG_SIZE ) .npy
131
+ --fileY data/two/y-$(LOGREG_SIZE ) .npy
128
132
ARGS_SKLEARN_logreg5 = --fileX data/multi/X-$(LOGREG_SIZE ) .npy \
129
- --fileY data/multi/y-$(LOGREG_SIZE ) .npy
133
+ --fileY data/multi/y-$(LOGREG_SIZE ) .npy
130
134
ARGS_SKLEARN_dfclf2 = --fileX data/two/X-$(DFCLF_SIZE ) .npy \
131
- --fileY data/two/y-$(DFCLF_SIZE ) .npy
135
+ --fileY data/two/y-$(DFCLF_SIZE ) .npy
132
136
ARGS_SKLEARN_dfclf5 = --fileX data/multi/X-$(DFCLF_SIZE ) .npy \
133
- --fileY data/multi/y-$(DFCLF_SIZE ) .npy
134
- ARGS_SKLEARN_dfreg = --fileX data/multi /X-$(DFREG_SIZE ) .npy \
135
- --fileY data/multi /y-$(DFREG_SIZE ) .npy
137
+ --fileY data/multi/y-$(DFCLF_SIZE ) .npy
138
+ ARGS_SKLEARN_dfreg = --fileX data/reg /X-$(DFREG_SIZE ) .npy \
139
+ --fileY data/reg /y-$(DFREG_SIZE ) .npy
136
140
137
141
DAAL4PY_distances = distances
138
142
DAAL4PY_ridge = ridge
@@ -154,22 +158,23 @@ ARGS_DAAL4PY_linear = --size "$(REGRESSION_SIZE)"
154
158
ARGS_DAAL4PY_pca_daal = --size "$(REGRESSION_SIZE ) " --svd-solver daal
155
159
ARGS_DAAL4PY_pca_full = --size "$(REGRESSION_SIZE ) " --svd-solver full
156
160
ARGS_DAAL4PY_kmeans = --data-multiplier "$(MULTIPLIER ) " \
157
- --filex data/kmeans_$(KMEANS_SIZE ) .npy \
158
- --filei data/kmeans_$(KMEANS_SIZE ) .init.npy
159
- ARGS_DAAL4PY_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
160
- --fileY data/two/y-$(SVM_SIZE ) .npy
161
+ --filex data/kmeans_$(KMEANS_SIZE ) .npy \
162
+ --filei data/kmeans_$(KMEANS_SIZE ) .init.npy \
163
+ --filet data/kmeans_$(KMEANS_SIZE ) .tol.npy
164
+ ARGS_DAAL4PY_svm2 = --fileX data/two/X-$(SVM_SIZE ) .npy \
165
+ --fileY data/two/y-$(SVM_SIZE ) .npy
161
166
ARGS_DAAL4PY_svm5 = --fileX data/multi/X-$(SVM_SIZE ) .npy \
162
- --fileY data/multi/y-$(SVM_SIZE ) .npy
167
+ --fileY data/multi/y-$(SVM_SIZE ) .npy
163
168
ARGS_DAAL4PY_logreg2 = --fileX data/two/X-$(LOGREG_SIZE ) .npy \
164
- --fileY data/two/y-$(LOGREG_SIZE ) .npy
169
+ --fileY data/two/y-$(LOGREG_SIZE ) .npy
165
170
ARGS_DAAL4PY_logreg5 = --fileX data/multi/X-$(LOGREG_SIZE ) .npy \
166
- --fileY data/multi/y-$(LOGREG_SIZE ) .npy
171
+ --fileY data/multi/y-$(LOGREG_SIZE ) .npy
167
172
ARGS_DAAL4PY_dfclf2 = --fileX data/two/X-$(DFCLF_SIZE ) .npy \
168
- --fileY data/two/y-$(DFCLF_SIZE ) .npy
173
+ --fileY data/two/y-$(DFCLF_SIZE ) .npy
169
174
ARGS_DAAL4PY_dfclf5 = --fileX data/multi/X-$(DFCLF_SIZE ) .npy \
170
- --fileY data/multi/y-$(DFCLF_SIZE ) .npy
171
- ARGS_DAAL4PY_dfreg = --fileX data/multi /X-$(DFREG_SIZE ) .npy \
172
- --fileY data/multi /y-$(DFREG_SIZE ) .npy
175
+ --fileY data/multi/y-$(DFCLF_SIZE ) .npy
176
+ ARGS_DAAL4PY_dfreg = --fileX data/reg /X-$(DFREG_SIZE ) .npy \
177
+ --fileY data/reg /y-$(DFREG_SIZE ) .npy
173
178
174
179
comma = ,
175
180
0 commit comments