Skip to content

Commit eb18d53

Browse files
committed
fix num_threads in fast_pe
test=develop
1 parent 5fc3052 commit eb18d53

File tree

2 files changed

+5
-5
lines changed

2 files changed

+5
-5
lines changed

paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.cc

Lines changed: 4 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -29,8 +29,8 @@ FastThreadedSSAGraphExecutor::FastThreadedSSAGraphExecutor(
2929
local_scopes_(local_scopes),
3030
places_(places),
3131
graph_(std::move(graph)),
32-
pool_(strategy.num_threads_ +
33-
1), // add one more thread for generate op_deps
32+
pool_(strategy.num_threads_),
33+
prepare_pool_(1), // dedicated single-thread pool for generating op_deps
3434
fetch_ctxs_(places) {
3535
auto &ops = graph_->Get<details::GraphOps>("ops");
3636

@@ -155,9 +155,8 @@ void FastThreadedSSAGraphExecutor::RunOpAsync(
155155
});
156156
}
157157
void FastThreadedSSAGraphExecutor::PrepareAtomicOpDeps() {
158-
atomic_op_deps_ = pool_.enqueue([&] {
159-
std::unordered_map<OpHandleBase *, std::atomic<int>> *op_deps =
160-
new std::unordered_map<OpHandleBase *, std::atomic<int>>;
158+
atomic_op_deps_ = prepare_pool_.enqueue([&] {
159+
auto *op_deps = new std::unordered_map<OpHandleBase *, std::atomic<int>>;
161160
for (auto &pair : op_deps_) {
162161
(*op_deps)[pair.first] = pair.second;
163162
}

paddle/fluid/framework/details/fast_threaded_ssa_graph_executor.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,6 +46,7 @@ class FastThreadedSSAGraphExecutor : public SSAGraphExecutor {
4646
std::vector<OpHandleBase *> bootstrap_ops_;
4747

4848
::ThreadPool pool_;
49+
::ThreadPool prepare_pool_;
4950
platform::DeviceContextPool fetch_ctxs_;
5051
std::atomic<int> remaining_;
5152

0 commit comments

Comments
 (0)