Skip to content

Commit 3667578

Browse files
committed
testing
1 parent d9320dc commit 3667578

File tree

2 files changed

+8
-4
lines changed

2 files changed

+8
-4
lines changed

paddle/fluid/platform/nccl_helper.h

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -108,8 +108,8 @@ struct NCCLContextMap {
108108
for (auto &gpu_id : order_) {
109109
int rank = trainer_id * order_.size() + gpu_id;
110110
PADDLE_ENFORCE(cudaSetDevice(gpu_id));
111-
PADDLE_ENFORCE(
112-
ncclCommInitRank(comms.get() + gpu_id, nranks, *nccl_id, rank));
111+
PADDLE_ENFORCE(platform::dynload::ncclCommInitRank(
112+
comms.get() + gpu_id, nranks, *nccl_id, rank));
113113
}
114114
}
115115
}

python/paddle/fluid/parallel_executor.py

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,9 @@ def __init__(self,
3030
num_threads=None,
3131
allow_op_delay=False,
3232
share_vars_from=None,
33-
use_default_grad_scale=True):
33+
use_default_grad_scale=True,
34+
num_nodes=0,
35+
trainer_id=0):
3436
"""
3537
ParallelExecutor can run program in parallel.
3638
@@ -129,7 +131,9 @@ def __init__(self,
129131
scope,
130132
local_scopes,
131133
allow_op_delay,
132-
use_default_grad_scale)
134+
use_default_grad_scale,
135+
num_nodes,
136+
trainer_id)
133137
self.scope = scope
134138

135139
def run(self, fetch_list, feed=None, feed_dict=None):

0 commit comments

Comments
 (0)