executor.h 3.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/* Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once

17 18 19
#include <map>
#include <memory>
#include <string>
20
#include <unordered_map>
21
#include <utility>
22
#include <vector>
23
#include "common/types.h"
Refine  
陈后江 已提交
24
#include "common/util.h"
L
liuruilong 已提交
25
#include "framework/lod_tensor.h"
L
liuruilong 已提交
26
#include "framework/operator.h"
27
#include "framework/program/program.h"
L
liuruilong 已提交
28
#include "framework/tensor.h"
29
#include "framework/type_trait.h"
30
#include "pass/memory_optimize.h"
31 32

namespace paddle_mobile {
33
namespace framework {
34

35
template <typename Device, typename T = float>
36
class Executor {
W
wangliu 已提交
37
 public:
xiebaiyuan's avatar
xiebaiyuan 已提交
38 39
  Executor(const Program<Device> &program,
           paddle_mobile::PaddleMobileConfigInternal config, int batch_size = 1,
40 41
           const bool use_optimize = true, const bool lod_mode = false);

42 43
  void SetThreadNum(int thread_num,
                    PowerMode power_mode = PERFORMANCE_PRIORITY);
44

45 46 47 48 49 50 51 52 53 54 55 56
  PMStatus Predict(const std::vector<std::pair<std::string, Tensor>> &inputs);
  PMStatus Predict(
      const std::vector<std::pair<std::string, LoDTensor>> &inputs);

  std::vector<T> Predict(const std::vector<T> &input,
                         const std::vector<int64_t> &dims);
  PMStatus Predict();

  void SetInput(const Tensor &input, const std::string &var_name);
  void SetInput(const LoDTensor &input, const std::string &var_name);

  std::shared_ptr<LoDTensor> GetOutput(const std::string &var_name);
57 58 59
#ifdef PADDLE_MOBILE_CL
  const CLImage *GetOutputImage(const std::string &var_name);
#endif
60

61 62 63
  void FeedTensorData(const std::vector<framework::Tensor> &v);
  void GetTensorResults(std::vector<framework::Tensor *> *v);

H
hjchen2 已提交
64
#ifdef PADDLE_MOBILE_FPGA
65 66
  void InjectVariable(const Tensor &t, std::string var_name);
  void FeedData(const Tensor &t);
67 68
  void FeedData(const std::vector<void *> &v);
  void GetResults(std::vector<void *> *v);
69
  framework::Tensor *GetTensorByName(const std::string &name);
70
  std::shared_ptr<Tensor> FetchResult(int id = -1);
H
hjchen2 已提交
71 72 73
  void Predict_From_To(int start = 0, int end = -1);
  void Predict_From(int start);
  void Predict_To(int end);
74 75 76
#ifdef PADDLE_MOBILE_FPGA_V2
  void InitQuantMemory();
#endif
H
hjchen2 已提交
77 78
#endif

W
wangliu 已提交
79
 protected:
80
  Executor() = default;
81

H
update  
hjchen2 已提交
82 83
  bool varInputMemory(const std::shared_ptr<VarDesc> &var_desc,
                      Variable *var) const;
84
  void InitFeedFetchList();
85
  void InitMemory();
L
liuruilong 已提交
86
  void InitCombineMemory();
Z
zhaojiaying01 已提交
87
  void InitNoPersistableMemory(const Tensor &input_tensor);
88 89
  void LoadMemory(void **data, const std::shared_ptr<VarDesc> var_desc,
                  LoDTensor *tensor);
L
liuruilong 已提交
90
#ifdef PADDLE_MOBILE_CL
91
  void LoadMemory(const VarDesc var_desc, float *tensorInput, char **data);
L
liuruilong 已提交
92
#endif
93 94 95 96

  int batch_size_;
  bool use_optimize_;
  bool lod_mode_;
L
liuruilong 已提交
97
  PaddleMobileConfigInternal config_;
98 99
  Program<Device> program_;
  std::shared_ptr<ProgramDesc> program_desc_;
100
  std::vector<std::shared_ptr<OperatorBase<Device>>> ops_of_block0_;
101 102
  std::unordered_map<std::string, int> feed_indices_;
  std::unordered_map<std::string, int> fetch_indices_;
103

104
  // for super resoltion
xiebaiyuan's avatar
xiebaiyuan 已提交
105
  DDim input_dim_last_;
106
  bool input_dim_has_changed_ = true;
L
liuruilong 已提交
107

D
dolphin8 已提交
108
#ifdef PADDLE_MOBILE_PROFILE
109 110
  typedef typename DtypeTensorTrait<Device>::gtype ProfileTensorType;

D
dolphin8 已提交
111 112 113 114 115
  struct ProfInfo {
    int tid = 0;
    uint64_t runBegin = 0UL;
    uint64_t runEnd = 0UL;
  };
116 117

  void PrintProfile(const vector<Executor<Device, T>::ProfInfo> &profile) const;
D
dolphin8 已提交
118
#endif
119 120
};

121
}  // namespace framework
W
wangliu 已提交
122
}  // namespace paddle_mobile