cxx_api_impl.cc 5.0 KB
Newer Older
Y
Yan Chunwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "lite/api/cxx_api.h"
16 17
#include <memory>
#include <mutex>  //NOLINT
18
#include <string>
Y
Yan Chunwei 已提交
19
#include "lite/api/paddle_api.h"
20
#include "lite/core/device_info.h"
21
#include "lite/core/version.h"
Y
Yan Chunwei 已提交
22

23 24 25 26 27 28
#if (defined LITE_WITH_X86) && (defined PADDLE_WITH_MKLML) && \
    !(defined LITE_ON_MODEL_OPTIMIZE_TOOL)
#include <omp.h>
#include "lite/backends/x86/mklml.h"
#endif

Y
Yan Chunwei 已提交
29 30 31 32
namespace paddle {
namespace lite {

// Builds the underlying predictor from `config` and caches the settings that
// later calls read back.
//
// In order, this:
//   1. Stores a copy of `config` in config_ (Clone() re-initializes from it).
//   2. With LITE_WITH_CUDA: initializes the CUDA environment if any valid
//      place targets kCUDA, and requests "multi_stream_analysis_pass" when
//      multi-stream is enabled in the config.
//   3. With LITE_WITH_MLU: initializes the MLU environment and forwards the
//      MLU-related config values to the global DeviceInfo.
//   4. Requests "type_layout_cast_preprocess_pass" when the first valid place
//      targets kOpenCL and the model directory contains the marker string
//      "OPENCL_PRE_PRECESS". This replaces any pass list chosen in step 2.
//   5. Builds raw_predictor_ and records the power mode and thread count that
//      Run() applies on ARM builds.
//   6. With x86 + MKLML (and not the model optimize tool): sets the MKL and
//      OpenMP thread counts, clamped to at least 1.
void CxxPaddleApiImpl::Init(const lite_api::CxxConfig &config) {
  config_ = config;
  auto places = config.valid_places();
  std::vector<std::string> passes{};
#ifdef LITE_WITH_CUDA
  // if kCUDA is included in valid places, it should be initialized first,
  // otherwise skip this step.
  for (auto &p : places) {
    if (p.target == TARGET(kCUDA)) {
      Env<TARGET(kCUDA)>::Init();
      if (config_.multi_stream()) {
        passes = {"multi_stream_analysis_pass"};
        VLOG(3) << "add pass: " << passes[0];
      }
      break;
    }
  }
#endif
#ifdef LITE_WITH_MLU
  Env<TARGET(kMLU)>::Init();
  lite::DeviceInfo::Global().SetMLURunMode(config.mlu_core_version(),
                                           config.mlu_core_number(),
                                           config.mlu_use_first_conv(),
                                           config.mlu_first_conv_mean(),
                                           config.mlu_first_conv_std(),
                                           config.mlu_input_layout());
#endif  // LITE_WITH_MLU
  // Position of the marker inside the model directory path, or
  // std::string::npos when the marker is absent.
  auto use_layout_preprocess_pass =
      config.model_dir().find("OPENCL_PRE_PRECESS");
  VLOG(1) << "use_layout_preprocess_pass:" << use_layout_preprocess_pass;
  // Check for an empty place list before looking at places[0]; indexing an
  // empty container is undefined behaviour.
  if (!places.empty() && places[0].target == TARGET(kOpenCL) &&
      use_layout_preprocess_pass != std::string::npos) {
    passes = {"type_layout_cast_preprocess_pass"};
    VLOG(1) << "add pass:" << passes[0];
  }
  raw_predictor_.Build(config, places, passes);
  mode_ = config.power_mode();
  threads_ = config.threads();

#if (defined LITE_WITH_X86) && (defined PADDLE_WITH_MKLML) && \
    !(defined LITE_ON_MODEL_OPTIMIZE_TOOL)
  int num_threads = config.x86_math_library_num_threads();
  // Values below 1 are clamped so the math libraries always get a valid count.
  int real_num_threads = num_threads > 1 ? num_threads : 1;
  paddle::lite::x86::MKL_Set_Num_Threads(real_num_threads);
  omp_set_num_threads(real_num_threads);
  // Log the value that was actually applied, not the raw requested one.
  VLOG(3) << "set_x86_math_library_math_threads() is set successfully and the "
             "number of threads is:"
          << real_num_threads;
#endif
}

// Returns a newly allocated lite_api::Tensor handle wrapping the pointer that
// raw_predictor_.GetInput(i) yields. The caller owns the returned handle.
std::unique_ptr<lite_api::Tensor> CxxPaddleApiImpl::GetInput(int i) {
  return std::unique_ptr<lite_api::Tensor>(
      new lite_api::Tensor(raw_predictor_.GetInput(i)));
}

// Returns a read-only handle wrapping the pointer that
// raw_predictor_.GetOutput(i) yields. The caller owns the returned handle.
std::unique_ptr<const lite_api::Tensor> CxxPaddleApiImpl::GetOutput(
    int i) const {
  // Keep the pointee const so the wrapper is built from a const pointer.
  const auto *raw_output = raw_predictor_.GetOutput(i);
  return std::unique_ptr<const lite_api::Tensor>(
      new lite_api::Tensor(raw_output));
}

S
sangoly 已提交
94
std::vector<std::string> CxxPaddleApiImpl::GetInputNames() {
95 96 97
  return raw_predictor_.GetInputNames();
}

S
sangoly 已提交
98
std::vector<std::string> CxxPaddleApiImpl::GetOutputNames() {
99 100 101
  return raw_predictor_.GetOutputNames();
}

T
TianXiaogang 已提交
102 103 104 105 106 107
// Runs the underlying predictor once.
//
// On builds with LITE_WITH_ARM, the power mode and thread count captured in
// Init() are first applied to the global DeviceInfo.
void CxxPaddleApiImpl::Run() {
#if defined(LITE_WITH_ARM)
  auto &device_info = lite::DeviceInfo::Global();
  device_info.SetRunMode(mode_, threads_);
#endif
  raw_predictor_.Run();
}
Y
Yan Chunwei 已提交
108

109 110 111 112 113 114 115
// Creates a fresh CxxPaddleApiImpl and initializes it from the config stored
// by Init(). mutex_ is held for the whole construction and initialization.
std::shared_ptr<lite_api::PaddlePredictor> CxxPaddleApiImpl::Clone() {
  std::lock_guard<std::mutex> guard(mutex_);
  auto cloned = std::make_shared<lite::CxxPaddleApiImpl>();
  cloned->Init(config_);
  return cloned;
}

116 117
// Returns the string produced by version().
std::string CxxPaddleApiImpl::GetVersion() const {
  return version();
}

Y
Yan Chunwei 已提交
118 119 120 121 122 123
// Returns a read-only handle wrapping the pointer that
// raw_predictor_.GetTensor(name) yields. The caller owns the returned handle.
std::unique_ptr<const lite_api::Tensor> CxxPaddleApiImpl::GetTensor(
    const std::string &name) const {
  return std::unique_ptr<const lite_api::Tensor>(
      new lite_api::Tensor(raw_predictor_.GetTensor(name)));
}

124 125 126 127 128 129
std::unique_ptr<lite_api::Tensor> CxxPaddleApiImpl::GetInputByName(
    const std::string &name) {
  return std::unique_ptr<lite_api::Tensor>(
      new lite_api::Tensor(raw_predictor_.GetInputByName(name)));
}

Y
Yan Chunwei 已提交
130
void CxxPaddleApiImpl::SaveOptimizedModel(const std::string &model_dir,
131 132 133
                                          lite_api::LiteModelType model_type,
                                          bool record_info) {
  raw_predictor_.SaveModel(model_dir, model_type, record_info);
Y
Yan Chunwei 已提交
134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149
}

}  // namespace lite

namespace lite_api {

// CxxConfig specialization of the predictor factory: constructs a
// CxxPaddleApiImpl, initializes it from `config`, and returns it through the
// PaddlePredictor interface.
template <>
std::shared_ptr<PaddlePredictor> CreatePaddlePredictor(
    const CxxConfig &config) {
  auto predictor = std::make_shared<lite::CxxPaddleApiImpl>();
  predictor->Init(config);
  return predictor;
}

}  // namespace lite_api
}  // namespace paddle