executor.h 3.2 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17
/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

#include <cstdint>
#include <map>
#include <memory>
#include <string>
#include <vector>

#include "common/types.h"
#include "framework/lod_tensor.h"
#include "framework/operator.h"
#include "framework/program/program.h"
#include "framework/tensor.h"

#ifdef PADDLE_EXECUTOR_MULTITHREAD
#include <condition_variable>
#include <mutex>
#include <thread>

#include "common/dep_core.h"
#endif

using std::string;
34 35 36

namespace paddle_mobile {

W
wangliu 已提交
37
template <typename Dtype = CPU, Precision P = Precision::FP32>
38
class Executor {
W
wangliu 已提交
39
 public:
40 41
  typedef typename PrecisionTrait<P>::ptype Ptype;

L
liuruilong 已提交
42 43 44 45
  /*
   * @b init executor with program load by Loader class
   * @b 用 loader load 的 program 实例化 executor
   * */
46
  Executor(const framework::Program<Dtype> p, int batch_size = 1,
xiebaiyuan's avatar
xiebaiyuan 已提交
47
           bool use_optimize = true, bool loddable = false);
48

L
liuruilong 已提交
49 50 51
  /*
   * @b to predict
   * */
52
  std::shared_ptr<framework::Tensor> Predict(const framework::Tensor &t);
xiebaiyuan's avatar
xiebaiyuan 已提交
53 54 55 56 57
  /*
   * @b to predict
   * */
  std::shared_ptr<framework::LoDTensor> PredictLod(
      const framework::LoDTensor &t);
L
liuruilong 已提交
58 59 60 61 62
  /*
   * @b to predict with vector and dim
   *
   * @b 使用 输入 和 输入的维度信息 进行预测
   * */
63 64 65
  std::vector<Ptype> Predict(const std::vector<Ptype> &input,
                             const std::vector<int64_t> &dims);

W
wangliu 已提交
66
 protected:
67 68 69
  Executor() = default;
  void InitMemory();
  void LoadMemory(const framework::VarDesc var_desc,
70
                  framework::LoDTensor *tensor, char **data);
L
liuruilong 已提交
71
  void InitCombineMemory();
72 73 74 75 76 77
  framework::Program<Dtype> program_;
  int batch_size_ = 1;
  std::shared_ptr<framework::ProgramDesc> to_predict_program_;
  std::shared_ptr<framework::Tensor> Predict(const framework::Tensor &t,
                                             int block_id);
  std::map<framework::BlockDesc,
W
wangliu 已提交
78 79
           std::vector<std::shared_ptr<framework::OperatorBase<Dtype>>>>
      ops_of_block_;
80
  bool use_optimize_ = false;
xiebaiyuan's avatar
xiebaiyuan 已提交
81
  bool loddable_ = false;
D
dolphin8 已提交
82 83 84 85 86 87 88 89 90 91
#ifdef PADDLE_EXECUTOR_MULTITHREAD
  std::vector<depCore> depManager;
#endif
#ifdef PADDLE_MOBILE_PROFILE
  struct ProfInfo {
    int tid = 0;
    uint64_t runBegin = 0UL;
    uint64_t runEnd = 0UL;
  };
#endif
xiebaiyuan's avatar
xiebaiyuan 已提交
92 93 94 95

  bool varInputMemory(const std::shared_ptr<framework::VarDesc> &var_desc,
                      framework::Variable *var,
                      framework::LoDTensor *tensor) const;
96 97

#ifdef PADDLE_MOBILE_FPGA
98

99
 public:
100
  void InjectVariable(const framework::Tensor &t, string var_name);
101 102 103 104 105 106
  void FeedData(const framework::Tensor &t);
  std::shared_ptr<framework::Tensor> FetchResult();
  void Predict_From_To(int start = 0, int end = -1);
  void Predict_From(int start);
  void Predict_To(int end);
#endif
107 108
};

W
wangliu 已提交
109
}  // namespace paddle_mobile