Skip to content

Commit 4bd6c7f

Browse files
committed
strong scaling, config updates, minor revisions
1 parent b3500dd commit 4bd6c7f

14 files changed

+200
-26
lines changed

configs/spmd/large_scale/basic_stats.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
"spmd basicstats parameters": {
55
"algorithm": {
66
"estimator": "BasicStatistics",
7-
"estimator_methods": { "training": "compute" }
7+
"estimator_methods": { "training": "fit" }
88
},
99
"data": {
1010
"split_kwargs": { "test_size": 0.0001 }
@@ -21,7 +21,7 @@
2121
"basicstats": {
2222
"SETS": [
2323
"sklearnex spmd implementation",
24-
"large scale default parameters",
24+
"large scale 2k parameters",
2525
"synthetic data",
2626
"spmd basicstats parameters"
2727
]
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
{
2+
"INCLUDE": ["../../common/sklearn.json", "../../spmd/stats_covariance.json", "large_scale.json"],
3+
"PARAMETERS_SETS": {
4+
"spmd basicstats parameters": {
5+
"algorithm": {
6+
"estimator": "BasicStatistics",
7+
"estimator_methods": { "training": "fit" }
8+
},
9+
"data": {
10+
"split_kwargs": { "test_size": 0.0001 }
11+
}
12+
},
13+
"synthetic data": {
14+
"data": [
15+
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 25000000, "n_features": 100, "centers": 1 } }
16+
]
17+
}
18+
},
19+
"TEMPLATES": {
20+
"basicstats": {
21+
"SETS": [
22+
"sklearnex spmd implementation",
23+
"large scale strong 2k parameters",
24+
"synthetic data",
25+
"spmd basicstats parameters"
26+
]
27+
}
28+
}
29+
}

configs/spmd/large_scale/covariance.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
"covariance": {
2222
"SETS": [
2323
"sklearnex spmd implementation",
24-
"large scale default parameters",
24+
"large scale 2k parameters",
2525
"synthetic data",
2626
"spmd basicstats parameters"
2727
]
Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
{
2+
"INCLUDE": ["../../common/sklearn.json", "../../spmd/stats_covariance.json", "large_scale.json"],
3+
"PARAMETERS_SETS": {
4+
"spmd basicstats parameters": {
5+
"algorithm": {
6+
"estimator": "EmpiricalCovariance",
7+
"estimator_methods": { "training": "fit" }
8+
},
9+
"data": {
10+
"split_kwargs": { "test_size": 0.0001 }
11+
}
12+
},
13+
"synthetic data": {
14+
"data": [
15+
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 25000000, "n_features": 100, "centers": 1 } }
16+
]
17+
}
18+
},
19+
"TEMPLATES": {
20+
"covariance": {
21+
"SETS": [
22+
"sklearnex spmd implementation",
23+
"large scale strong 2k parameters",
24+
"synthetic data",
25+
"spmd basicstats parameters"
26+
]
27+
}
28+
}
29+
}

configs/spmd/large_scale/kmeans.json

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -7,15 +7,14 @@
77
"estimator_params": {
88
"algorithm": "lloyd"
99
},
10-
"estimator_methods": { "training": "fit" }
11-
},
12-
"bench": {
13-
"mpi_params": {"n": 48}
10+
"estimator_methods": { "training": "fit", "inference": "predict" }
1411
}
1512
},
1613
"synthetic data": {
1714
"data": [
18-
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 5000000, "n_features": 10, "centers": 10 }, "algorithm": { "n_clusters": 10, "max_iter": 10 } }
15+
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 5000000, "n_features": 10, "centers": 10 }, "algorithm": { "n_clusters": 10, "max_iter": 10 } },
16+
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 30000, "n_features": 1000, "centers": 10 }, "algorithm": { "n_clusters": 10, "max_iter": 10 } },
17+
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 1000000, "n_features": 100, "centers": 100 }, "algorithm": { "n_clusters": 100, "max_iter": 100 } }
1918
]
2019
}
2120
},
@@ -24,7 +23,7 @@
2423
"SETS": [
2524
"synthetic data",
2625
"sklearnex spmd implementation",
27-
"large scale default parameters",
26+
"large scale 2k parameters",
2827
"spmd kmeans parameters"
2928
]
3029
}

configs/spmd/large_scale/knn.json

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -15,9 +15,6 @@
1515
"training": "fit",
1616
"inference": "predict"
1717
}
18-
},
19-
"bench": {
20-
"mpi_params": {}
2118
}
2219
},
2320
"synthetic classification data": {
@@ -35,7 +32,7 @@
3532
"common knn parameters",
3633
"synthetic classification data",
3734
"sklearnex spmd implementation",
38-
"large scale 2k parameters",
35+
"large scale default parameters",
3936
"spmd knn cls parameters"
4037
]
4138
}

configs/spmd/large_scale/large_scale.json

Lines changed: 21 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,16 @@
66
"distributed_split": "None"
77
},
88
"bench": {
9-
"mpi_params": {"n": [1,2,3,4,5,6,7,8,9,10,11,12], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
9+
"mpi_params": {"n": [1,2,6,12], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
10+
}
11+
},
12+
"large scale strong parameters": {
13+
"data": {
14+
"dtype": "float64",
15+
"distributed_split": "rank_based"
16+
},
17+
"bench": {
18+
"mpi_params": {"n": [1,2,6,12], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
1019
}
1120
},
1221
"large scale 2k parameters": {
@@ -15,7 +24,16 @@
1524
"distributed_split": "None"
1625
},
1726
"bench": {
18-
"mpi_params": {"n": [192,384,768,1536,3072,6144,12288,24576], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
27+
"mpi_params": {"n": [1,2,6,12,24,48,96,192,384,768,1536,3072,6144,12288,24576], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
28+
}
29+
},
30+
"large scale strong 2k parameters": {
31+
"data": {
32+
"dtype": "float64",
33+
"distributed_split": "rank_based"
34+
},
35+
"bench": {
36+
"mpi_params": {"n": [1,2,6,12,24,48,96,192,384,768,1536,3072,6144,12288,24576], "ppn": 12, "-hostfile": "", "-cpu-bind=list:0-7,104-111:8-15,112-119:16-23,120-127:24-31,128-135:32-39,136-143:40-47,144-151:52-59,156-163:60-67,164-171:68-75,172-179:76-83,180-187:84-91,188-195:92-99,196-203": "--envall gpu_tile_compact.sh" }
1937
}
2038
},
2139
"large scale impi parameters": {
@@ -24,7 +42,7 @@
2442
"distributed_split": "no"
2543
},
2644
"bench": {
27-
"mpi_params": {"n": [1,2,4,6,12,24], "ppn": 12}
45+
"mpi_params": {"n": [1,2,4,6,9,12], "ppn": 12}
2846
}
2947
}
3048
}

configs/spmd/large_scale/linear_model.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
"linreg": {
1919
"SETS": [
2020
"sklearnex spmd implementation",
21-
"large scale default parameters",
21+
"large scale 2k parameters",
2222
"synthetic data",
2323
"spmd linear parameters"
2424
]
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
{
2+
"INCLUDE": ["../../common/sklearn.json", "../../regular/linear_model.json", "large_scale.json"],
3+
"PARAMETERS_SETS": {
4+
"spmd linear parameters": {
5+
"algorithm": {
6+
"estimator": "LinearRegression",
7+
"estimator_methods": { "training": "fit" }
8+
}
9+
},
10+
"synthetic data": {
11+
"data": [
12+
{ "source": "make_regression", "generation_kwargs": { "n_samples": 25005000, "n_features": 100, "noise": 1.25 }, "split_kwargs": { "train_size": 25000000, "test_size": 5000 } }
13+
]
14+
}
15+
},
16+
"TEMPLATES": {
17+
"linreg": {
18+
"SETS": [
19+
"sklearnex spmd implementation",
20+
"large scale strong 2k parameters",
21+
"synthetic data",
22+
"spmd linear parameters"
23+
]
24+
}
25+
}
26+
}
Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
{
2+
"INCLUDE": ["../../common/sklearn.json", "../../regular/logreg.json", "../logreg.json", "large_scale.json"],
3+
"PARAMETERS_SETS": {
4+
"spmd logreg2 parameters": {
5+
"algorithm":{
6+
"estimator": "LogisticRegression",
7+
"estimator_methods": { "inference": "predict" },
8+
"estimator_params": { "max_iter": 30 }
9+
}
10+
},
11+
"synthetic data": {
12+
"data": [
13+
{ "source": "make_classification", "split_kwargs": { "train_size": 10000000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 10001000, "n_features": 100, "n_classes": 2 } }
14+
]
15+
}
16+
},
17+
"TEMPLATES": {
18+
"logreg": {
19+
"SETS": [
20+
"sklearnex spmd implementation",
21+
"large scale strong 2k parameters",
22+
"spmd logreg parameters",
23+
"synthetic data",
24+
"spmd logreg2 parameters"
25+
]
26+
}
27+
}
28+
}

0 commit comments

Comments
 (0)