only InferShape when input shape has been changed (#1748)

* only InferShape when input shape has been changed
* apply input_dim_has_changed_ criterion only when model has one input vector

only InferShape when input shape has been changed (#1748)
* only InferShape when input shape has been changed
* apply input_dim_has_changed_ criterion only when model has one input vector
b42f3d49 · Yanzhan Yang · GitHub · 16a0bd75 · b42f3d49 · b42f3d49
Hide whitespace changes
Inline / Side-by-side

Showing 2 changed files with 18 additions and 1 deletion

src/framework/executor.cpp src/framework/executor.cpp +17 -1

src/framework/executor.h src/framework/executor.h +1 -0

No files found.
--- a/src/framework/executor.cpp
+++ b/src/framework/executor.cpp
@@ -409,6 +409,11 @@ void Executor<Device, T>::SetInput(const Tensor &input,
  target.Resize(input.dims());
  target.ShareDataWith(input);
+  if (feed_indices_.size() == 1) {
+    auto &dim = input.dims();
+    input_dim_has_changed_ = input_dim_last_ != dim;
+    input_dim_last_ = static_cast<DDim>(dim);
+  }
 }
 template <typename Device, typename T>
@@ -425,6 +430,11 @@ void Executor<Device, T>::SetInput(const LoDTensor &input,
  target.Resize(input.dims());
  target.ShareDataWith(input);
  target.set_lod(input.lod());
+  if (feed_indices_.size() == 1) {
+    auto &dim = input.dims();
+    input_dim_has_changed_ = input_dim_last_ != dim;
+    input_dim_last_ = static_cast<DDim>(dim);
+  }
 }
 template <typename Device, typename T>
@@ -469,7 +479,7 @@ PMStatus Executor<Device, T>::Predict() {
    profile[op_index].runBegin = (uint64_t)ts.tv_sec * 1e9 + ts.tv_nsec;
 #endif
    DLOG << "run op: " << op_handler->Type();
-    if (lod_mode_) {
+    if (lod_mode_ && input_dim_has_changed_) {
      op_handler->InferShape();
    }
    op_handler->Run();
@@ -479,6 +489,9 @@ PMStatus Executor<Device, T>::Predict() {
    ++op_index;
 #endif
  }
+  if (feed_indices_.size() == 1) {
+    input_dim_has_changed_ = false;
+  }
 #ifdef PADDLE_MOBILE_PROFILE
  PrintProfile(profile);
@@ -793,6 +806,9 @@ void Executor<GPU_CL, float>::SetInput(const Tensor &input,
    DLOG << "SetInput ---- > ShareDataWith";
  }
  target_tensor->ShareDataWith(input);
+  if (feed_indices_.size() == 1) {
+    input_dim_has_changed_ = input_dim_last_ != input.dims();
+  }
  auto &dim = input.dims();
  input_dim_last_ = static_cast<DDim>(dim);
 }

--- a/src/framework/executor.h
+++ b/src/framework/executor.h
@@ -99,6 +99,7 @@ class Executor {
  // for super resoltion
  DDim input_dim_last_;
+  bool input_dim_has_changed_ = true;
 #ifdef PADDLE_MOBILE_PROFILE
  typedef typename DtypeTensorTrait<Device>::gtype ProfileTensorType;