Skip to content

Commit 7066b38

Browse files
authored
Merge pull request #14395 from sneaxiy/fix_num_threads_in_fast_pe
Fix num_threads settings in fast_pe
2 parents 10ab177 + 38d32c9 commit 7066b38

File tree

2 files changed

+4
-3
lines changed

2 files changed

+4
-3
lines changed

paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -30,8 +30,8 @@ FastThreadedSSAGraphExecutor::FastThreadedSSAGraphExecutor(
3030
local_scopes_(local_scopes),
3131
places_(places),
3232
graph_(std::move(graph)),
33-
pool_(strategy.num_threads_ +
34-
1), // add one more thread for generate op_deps
33+
pool_(strategy.num_threads_),
34+
prepare_pool_(1), // separate single-thread pool used for generating op_deps
3535
fetch_ctxs_(places) {
3636
for (auto &op : ir::FilterByNodeWrapper<OpHandleBase>(*graph_)) {
3737
int dep = static_cast<int>(op->NotReadyInputSize());
@@ -160,7 +160,7 @@ void FastThreadedSSAGraphExecutor::RunOpAsync(
160160
});
161161
}
162162
void FastThreadedSSAGraphExecutor::PrepareAtomicOpDeps() {
163-
atomic_op_deps_ = pool_.enqueue([&] {
163+
atomic_op_deps_ = prepare_pool_.enqueue([&] {
164164
auto *op_deps = new std::unordered_map<OpHandleBase *, std::atomic<int>>;
165165
for (auto &pair : op_deps_) {
166166
(*op_deps)[pair.first] = pair.second;

paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.h

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -46,6 +46,7 @@ class FastThreadedSSAGraphExecutor : public SSAGraphExecutor {
4646
std::vector<OpHandleBase *> bootstrap_ops_;
4747

4848
::ThreadPool pool_;
49+
::ThreadPool prepare_pool_;
4950
platform::DeviceContextPool fetch_ctxs_;
5051
std::atomic<int> remaining_;
5152

0 commit comments

Comments
 (0)