@@ -25,43 +25,44 @@ ParameterServerController::ParameterServerController(
25
25
int numPorts = config.ports_num () + config.ports_num_for_sparse ();
26
26
27
27
if (config.nics ().empty ()) {
28
- pservers_ .resize (numPorts);
28
+ parameterServers_ .resize (numPorts);
29
29
for (int i = 0 ; i < numPorts; ++i) {
30
30
if (config.rdma_tcp () == " rdma" ) {
31
- pservers_ [i].reset (
31
+ parameterServers_ [i].reset (
32
32
new ParameterServer2 (std::string (), config.port () + i, rdmaCpu++));
33
33
rdmaCpu = rdmaCpu % onlineCpus;
34
34
} else {
35
- pservers_ [i].reset (
35
+ parameterServers_ [i].reset (
36
36
new ParameterServer2 (std::string (), config.port () + i));
37
37
}
38
- CHECK (pservers_[i]->init ()) << " Fail to initialize parameter server"
39
- << config.port () + i;
38
+ CHECK (parameterServers_[i]->init ()) << " Fail to initialize parameter "
39
+ " server on port "
40
+ << config.port () + i;
40
41
}
41
42
} else {
42
43
str::split (config.nics (), ' ,' , &devices);
43
- pservers_ .resize (devices.size () * numPorts);
44
+ parameterServers_ .resize (devices.size () * numPorts);
44
45
for (int i = 0 ; i < numPorts; ++i) {
45
46
for (size_t j = 0 ; j < devices.size (); ++j) {
46
47
if (config.rdma_tcp () == " rdma" ) {
47
- pservers_ [i * devices.size () + j].reset (new ParameterServer2 (
48
+ parameterServers_ [i * devices.size () + j].reset (new ParameterServer2 (
48
49
getIpAddr (devices[j]), config.port () + i, rdmaCpu++));
49
50
rdmaCpu = rdmaCpu % onlineCpus;
50
51
} else {
51
- pservers_ [i * devices.size () + j].reset (
52
+ parameterServers_ [i * devices.size () + j].reset (
52
53
new ParameterServer2 (getIpAddr (devices[j]), config.port () + i));
53
54
}
54
- CHECK (pservers_ [i * devices.size () + j]->init ())
55
- << " Fail to initialize parameter server" << devices[j]
55
+ CHECK (parameterServers_ [i * devices.size () + j]->init ())
56
+ << " Fail to initialize parameter server with device " << devices[j]
56
57
<< config.port () + i;
57
58
}
58
59
}
59
60
}
60
61
}
61
62
62
- ParameterServerController::~ParameterServerController () { this ->join (); }
63
+ ParameterServerController::~ParameterServerController () { this ->wait (); }
63
64
64
- ParameterServerController* ParameterServerController::createByGflags () {
65
+ ParameterServerController* ParameterServerController::createFromGflags () {
65
66
ParameterServerConfig config;
66
67
67
68
config.set_nics (FLAGS_nics);
@@ -79,21 +80,21 @@ ParameterServerController* ParameterServerController::create(
79
80
}
80
81
81
82
void ParameterServerController::start () {
82
- LOG (INFO) << " pserver sizes : " << pservers_.size ();
83
+ LOG (INFO) << " number of parameterServer instances: "
84
+ << parameterServers_.size ();
83
85
int i = 0 ;
84
- for (const auto & pserver : pservers_ ) {
85
- LOG (INFO) << " pserver started : " << i;
86
- pserver ->start ();
86
+ for (const auto & parameterServer : parameterServers_ ) {
87
+ LOG (INFO) << " Starting parameterServer[ " << i << " ] " ;
88
+ parameterServer ->start ();
87
89
i++;
88
90
}
89
91
}
90
92
91
- void ParameterServerController::join () {
92
- LOG (INFO) << " pserver sizes : " << pservers_.size ();
93
+ void ParameterServerController::wait () {
93
94
int i = 0 ;
94
- for (const auto & pserver : pservers_ ) {
95
- LOG (INFO) << " pserver join : " << i;
96
- pserver ->join ();
95
+ for (const auto & parameterServer : parameterServers_ ) {
96
+ LOG (INFO) << " Waiting parameterServer[ " << i << " ] " ;
97
+ parameterServer ->join ();
97
98
i++;
98
99
}
99
100
}
0 commit comments