未验证 提交 fcb9c0b5 作者: Hui Zhang 提交者: GitHub

[cherrypick] Construct exec and ctx only once in cond op to speed up (#47012)

Construct exec and ctx only once in cond op to speed up
上级 de6f15b6
...@@ -14,6 +14,11 @@ limitations under the License. */ ...@@ -14,6 +14,11 @@ limitations under the License. */
#include "paddle/fluid/operators/controlflow/conditional_block_op.h" #include "paddle/fluid/operators/controlflow/conditional_block_op.h"
#ifdef PADDLE_WITH_MKLDNN
#include "paddle/fluid/platform/mkldnn_helper.h"
#endif
DECLARE_bool(use_mkldnn);
namespace paddle { namespace paddle {
namespace framework { namespace framework {
class OpDesc; class OpDesc;
...@@ -73,14 +78,33 @@ class ConditionalBlockInferOp : public ConditionalOp { ...@@ -73,14 +78,33 @@ class ConditionalBlockInferOp : public ConditionalOp {
scopes->front() = &scope.NewScope(); scopes->front() = &scope.NewScope();
auto &cur_scope = *scopes->front(); auto &cur_scope = *scopes->front();
framework::Executor exec(dev_place);
auto *block = Attr<framework::BlockDesc *>("sub_block"); auto *block = Attr<framework::BlockDesc *>("sub_block");
VLOG(3) << "Conditional block.idx = " << block->ID() VLOG(3) << "Conditional block.idx = " << block->ID()
<< ", scope = " << &cur_scope; << ", scope = " << &cur_scope;
exec.Run(*block->Program(), &cur_scope, block->ID(), false);
if (!exec_ || !platform::is_same_place(exec_->GetPlace(), dev_place)) {
auto &pdesc = *block->Program();
exec_.reset(new framework::Executor(dev_place));
#ifdef PADDLE_WITH_MKLDNN
if (FLAGS_use_mkldnn) exec_->EnableMKLDNN(pdesc);
#endif
ctx_ = exec_->Prepare(
pdesc, block->ID(), std::vector<std::string>(), false);
#ifdef PADDLE_WITH_MKLDNN
if (FLAGS_use_mkldnn) {
platform::AttachPointerHashToMKLDNNKey(exec_.get(), dev_place);
platform::RegisterModelLayout(ctx_->ops_, dev_place);
}
#endif
}
exec_->RunPreparedContext(ctx_.get(), &cur_scope, false, true, false);
scope.DeleteScope(scopes->front()); scope.DeleteScope(scopes->front());
} }
} }
private:
mutable std::shared_ptr<framework::Executor> exec_{nullptr};
mutable std::unique_ptr<framework::ExecutorPrepareContext> ctx_{nullptr};
}; };
} // namespace operators } // namespace operators
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册