// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "lite/api/cxx_api.h"
#include <algorithm>
#include <memory>
#include <set>
#include <string>
#include <utility>
#include <vector>
#include "lite/api/paddle_use_passes.h"
#include "lite/utils/io.h"

namespace paddle {
namespace lite {

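// Serialize the optimized program to `dir`, either as a protobuf model or as
// a naive-buffer model. When `record_info` is true, the lists of ops and
// kernels actually used by the model are also written out (see
// SaveOpKernelInfo) for use in source-code tailoring.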
void Predictor::SaveModel(const std::string &dir,
                          lite_api::LiteModelType model_type,
                          bool record_info) {
  if (!program_) {
    GenRuntimeProgram();
  }
  program_->SaveOpInfosToProgram(program_desc_.get());
  program_->UpdateVarsOfProgram(program_desc_.get());
  switch (model_type) {
    case lite_api::LiteModelType::kProtobuf:
      SaveModelPb(dir, *program_->exec_scope(), *program_desc_.get(), true);
      break;
    case lite_api::LiteModelType::kNaiveBuffer:
      SaveModelNaive(dir, *program_->exec_scope(), *program_desc_.get());
      break;
    default:
      LOG(FATAL) << "Unknown model type";
  }
  if (record_info) {
    MkDirRecur(dir);
    SaveOpKernelInfo(dir);
  }
}

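// Collect the op types and kernel signatures (op,target,precision,layout,alias)
// used by the runtime program, map them to their source files via
// OpKernelInfoCollector, and write four list files into `model_dir` so that
// the library can be tailored to this model.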
void Predictor::SaveOpKernelInfo(const std::string &model_dir) {
  std::set<std::string> ops_info;
  std::set<std::string> kernels_info;
  const auto &instructions_ = program_->instructions();
  for (auto &node : instructions_) {
    // parse op type information
    auto op = node.op()->op_info();
    ops_info.insert(op->Type());
    // parse kernel type information
    std::string kernel_type_str =
        node.kernel()->op_type() + "," + TargetRepr(node.kernel()->target()) +
        "," + PrecisionRepr(node.kernel()->precision()) + "," +
        DataLayoutRepr(node.kernel()->layout()) + "," + node.kernel()->alias();
    kernels_info.insert(kernel_type_str);
  }

  // get source file names from the op and kernel types
  auto op2pathmap = OpKernelInfoCollector::Global().GetOp2PathDict();
  auto kernel2pathmap = OpKernelInfoCollector::Global().GetKernel2PathDict();

  // write used op and kernel info into files
  std::string opf_path = model_dir + "/" + TAILORD_OPS_LIST_NAME;
  std::string opf_source_path =
      model_dir + "/" + TAILORD_OPS_SOURCE_LIST_FILENAME;
  std::string kpf_path = model_dir + "/" + TAILORD_KERNELS_LIST_NAME;
  std::string kpf_source_path =
      model_dir + "/" + TAILORD_KERNELS_SOURCE_LIST_FILENAME;
  std::map<std::string, std::string> op2path;

  std::FILE *opf = std::fopen(opf_path.c_str(), "w");
  std::FILE *opf_source = std::fopen(opf_source_path.c_str(), "w");
  std::FILE *kpf = std::fopen(kpf_path.c_str(), "w");
  std::FILE *kpf_source = std::fopen(kpf_source_path.c_str(), "w");
  std::vector<std::string> opcompile;
  std::vector<std::string> kernelcompile;

  if (nullptr == opf || nullptr == opf_source || nullptr == kpf ||
      nullptr == kpf_source) {
    LOG(FATAL) << "failed to create info files in: " << model_dir;
  }
  for (auto op_info = ops_info.begin(); op_info != ops_info.end(); op_info++) {
    fputs(op_info->c_str(), opf);
    fputc('\n', opf);
    std::string op_path = op2pathmap[*op_info];
    fputs(op_path.c_str(), opf_source);
    fputc('\n', opf_source);
  }
  std::fclose(opf_source);
  std::fclose(opf);
  LOG(INFO) << "Operator information for the tailored model is stored in: "
            << opf_path;

  // write kernel types and kernel source paths into files
  for (auto kernel_info = kernels_info.begin();
       kernel_info != kernels_info.end();
       kernel_info++) {
    fputs(kernel_info->c_str(), kpf);
    fputc('\n', kpf);
    std::string kernel_path = kernel2pathmap[*kernel_info];
    fputs(kernel_path.c_str(), kpf_source);
    fputc('\n', kpf_source);
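    // conv_compute.cc dispatches to several conv implementations; list their
    // source files as well so they survive source-code tailoring.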
    if (kernel_path == "conv_compute.cc") {
      fputs(
          "conv_depthwise.cc\nconv_direct.cc\nconv_gemmlike.cc\nconv_"
          "winograd.cc\n",
          kpf_source);
    }
  }
  std::fclose(kpf_source);
  std::fclose(kpf);
  LOG(INFO) << "Kernel information for the tailored model is stored in: "
            << kpf_path;
}

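// Input accessors. On most targets an input is looked up by its name in
// input_names_; with LITE_WITH_FPGA the inputs live in the scope's "feed"
// tensor vector and are addressed by offset.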
#ifndef LITE_WITH_FPGA
lite::Tensor *Predictor::GetInput(size_t offset) {
  CHECK(input_names_.size() > offset)
      << "The network has " << input_names_.size() << " inputs"
      << ", the offset should be less than this.";
  auto *in_var = exec_scope_->FindVar(input_names_[offset]);
  CHECK(in_var) << "no input variable " << input_names_[offset]
                << " in exec_scope";
  return in_var->GetMutable<lite::Tensor>();
}
#else
lite::Tensor *Predictor::GetInput(size_t offset) {
  auto *_feed_list = exec_scope_->FindVar("feed");
  CHECK(_feed_list) << "no feed variable in exec_scope";
  auto *feed_list = _feed_list->GetMutable<std::vector<lite::Tensor>>();
  if (offset >= feed_list->size()) {
    feed_list->resize(offset + 1);
  }
  return &feed_list->at(offset);
}
#endif

// get input names
std::vector<std::string> Predictor::GetInputNames() { return input_names_; }

// get output names
std::vector<std::string> Predictor::GetOutputNames() { return output_names_; }

// get param names
std::vector<std::string> Predictor::GetParamNames() {
  return exec_scope_->AttributeVarNames();
}

// append the names of inputs and outputs into input_names_ and output_names_
void Predictor::PrepareFeedFetch() {
  if (!program_) {
    GenRuntimeProgram();
  }

  std::vector<const cpp::OpDesc *> feeds;
  std::vector<const cpp::OpDesc *> fetchs;
  const auto &insts = program_->instructions();
  for (size_t i = 0; i < program_->num_instructions(); i++) {
    const auto &op = insts[i].op()->op_info();
    if (op->Type() == "feed") {
      feeds.push_back(op);
    } else if (op->Type() == "fetch") {
      fetchs.push_back(op);
    }
  }

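  // The name vectors are indexed by each feed/fetch op's "col" attribute, so
  // their order matches the column order in the original program.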
  input_names_.resize(feeds.size());
  output_names_.resize(fetchs.size());
  for (size_t i = 0; i < feeds.size(); i++) {
    input_names_[feeds[i]->GetAttr<int>("col")] =
        feeds[i]->Output("Out").front();
  }
  for (size_t i = 0; i < fetchs.size(); i++) {
    output_names_[fetchs[i]->GetAttr<int>("col")] =
        fetchs[i]->Input("X").front();
  }
}

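// Output accessors mirror the input ones: by default outputs are found by
// name via output_names_; with LITE_WITH_FPGA they are read from the scope's
// "fetch" tensor vector.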
#ifndef LITE_WITH_FPGA

const lite::Tensor *Predictor::GetOutput(size_t offset) const {
  CHECK(output_names_.size() > offset)
      << "The network has " << output_names_.size() << " outputs"
      << ", the offset should be less than this.";
  const std::string name = output_names_.at(offset);
  auto *out_var = exec_scope_->FindVar(name);
  CHECK(out_var) << "no output variable " << name << " in exec_scope";
  return out_var->GetMutable<lite::Tensor>();
}

std::vector<const lite::Tensor *> Predictor::GetOutputs() const {
  std::vector<const lite::Tensor *> outputs;
  size_t out_size = output_names_.size();
  for (size_t i = 0; i < out_size; i++) {
    const std::string name = output_names_.at(i);
    outputs.push_back(GetTensor(name));
  }
  return outputs;
}
#else

const lite::Tensor *Predictor::GetOutput(size_t offset) const {
  auto *_fetch_list = exec_scope_->FindVar("fetch");
  CHECK(_fetch_list) << "no fetch variable in exec_scope";
  auto &fetch_list = *_fetch_list->GetMutable<std::vector<lite::Tensor>>();
  CHECK_LT(offset, fetch_list.size()) << "offset " << offset << " overflow";
  return &fetch_list.at(offset);
}

std::vector<const lite::Tensor *> Predictor::GetOutputs() const {
  auto *_fetch_list = exec_scope_->FindVar("fetch");
  CHECK(_fetch_list) << "no fetch variable in exec_scope";
  auto &fetch_list = *_fetch_list->GetMutable<std::vector<lite::Tensor>>();

  std::vector<const lite::Tensor *> outputs;
  for (const auto &out : fetch_list) {
    outputs.push_back(&out);
  }
  return outputs;
}

#endif

const cpp::ProgramDesc &Predictor::program_desc() const {
  return *program_desc_.get();
}
const RuntimeProgram &Predictor::runtime_program() const { return *program_; }

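// Build() comes in three layers: the CxxConfig overload below extracts the
// model paths, the path overload deserializes the model into program_desc_,
// and the ProgramDesc overload runs the optimizer and prepares feed/fetch.
//
// A minimal usage sketch (for illustration only; it assumes the default
// arguments and the Run() method declared in lite/api/cxx_api.h, and the
// model directory name is hypothetical):
//
//   lite_api::CxxConfig config;
//   config.set_model_dir("./mobilenet_v1");
//   Predictor predictor;
//   predictor.Build(config, {Place{TARGET(kARM), PRECISION(kFloat)}});
//   lite::Tensor *input = predictor.GetInput(0);   // resize and fill input
//   predictor.Run();
//   const lite::Tensor *output = predictor.GetOutput(0);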
void Predictor::Build(const lite_api::CxxConfig &config,
                      const std::vector<Place> &valid_places,
                      const std::vector<std::string> &passes,
                      lite_api::LiteModelType model_type) {
  const std::string &model_path = config.model_dir();
  const std::string &model_file = config.model_file();
  const std::string &param_file = config.param_file();
  const bool model_from_memory = config.model_from_memory();
  if (model_from_memory) {
    LOG(INFO) << "Load model from memory.";
  } else {
    LOG(INFO) << "Load model from file.";
  }

  Build(model_path,
        model_file,
        param_file,
        valid_places,
        passes,
        model_type,
        model_from_memory);
}
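
// Deserialize the model from `model_path` (protobuf, optionally with combined
// model/param files, or naive buffer) into scope_ and program_desc_, then hand
// the program over to the ProgramDesc overload below.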
void Predictor::Build(const std::string &model_path,
                      const std::string &model_file,
                      const std::string &param_file,
                      const std::vector<Place> &valid_places,
                      const std::vector<std::string> &passes,
                      lite_api::LiteModelType model_type,
                      bool model_from_memory) {
  switch (model_type) {
    case lite_api::LiteModelType::kProtobuf: {
      bool combined_param = false;
      if (!model_file.empty() && !param_file.empty()) {
        combined_param = true;
      }
      LoadModelPb(model_path,
                  model_file,
                  param_file,
                  scope_.get(),
                  program_desc_.get(),
                  combined_param,
                  model_from_memory);
    } break;
    case lite_api::LiteModelType::kNaiveBuffer:
      CHECK(!model_path.empty())
          << "The NaiveBuffer backend only supports combined params";
      LoadModelNaiveFromFile(model_path, scope_.get(), program_desc_.get());
      break;
    default:
      LOG(FATAL) << "Unknown model type";
  }
  Build(program_desc_, valid_places, passes);
}

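// Core build step: derive `inner_places` from the valid places, detect
// quantized models (adding an ARM int8 place when built with LITE_WITH_ARM),
// then run the optimizer over the program and record the feed/fetch names.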
void Predictor::Build(const std::shared_ptr<cpp::ProgramDesc> &desc,
                      const std::vector<Place> &valid_places,
                      const std::vector<std::string> &passes) {
  program_desc_ = desc;
  // `inner_places` is the list of places handed to the optimization passes
  std::vector<Place> inner_places = valid_places;
  for (auto &valid_place : valid_places) {
    if (valid_place.target == TARGET(kOpenCL)) continue;
    inner_places.emplace_back(
        Place(TARGET(kHost), valid_place.precision, valid_place.layout));
  }

  // Analyze whether the model is quantized.
  // For a quantized model, add Place(kARM, kInt8) to inner_places.
  const std::vector<std::string> quant_dequant_op = {
      "fake_quantize_abs_max",
      "fake_quantize_range_abs_max",
      "fake_quantize_moving_average_abs_max",
      "fake_quantize_dequantize_moving_average_abs_max",
      "fake_dequantize_max_abs",
      "fake_channel_wise_dequantize_max_abs"};
  bool is_quantized_model = false;
  for (size_t i = 0; i < program_desc_->BlocksSize() && !is_quantized_model;
       ++i) {
    auto *block_desc = program_desc_->GetBlock<cpp::BlockDesc>(i);
    for (size_t j = 0; j < block_desc->OpsSize() && !is_quantized_model; ++j) {
      auto *op_desc = block_desc->GetOp<cpp::OpDesc>(j);
      std::string op_type = op_desc->Type();
      if (std::find(quant_dequant_op.begin(),
                    quant_dequant_op.end(),
                    op_type) != quant_dequant_op.end()) {
        is_quantized_model = true;
      }
    }
  }
  if (is_quantized_model) {
#ifdef LITE_WITH_ARM
    inner_places.insert(inner_places.begin(),
                        Place{TARGET(kARM), PRECISION(kInt8)});
#endif
  }

  Program program(*desc.get(), scope_, inner_places);
  valid_places_ = inner_places;

  core::KernelPickFactor factor;
  factor.ConsiderTarget();
  factor.ConsiderPrecision();
  factor.ConsiderDataLayout();

  optimizer_.Run(std::move(program), inner_places, factor, passes);
  exec_scope_ = optimizer_.exec_scope();
  PrepareFeedFetch();
}

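// Materialize the optimized RuntimeProgram; called lazily from SaveModel()
// and PrepareFeedFetch() when the program has not been generated yet.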
void Predictor::GenRuntimeProgram() {
  program_ = optimizer_.GenRuntimeProgram();
  CHECK_EQ(exec_scope_, program_->exec_scope());
  program_generated_ = true;
}

const lite::Tensor *Predictor::GetTensor(const std::string &name) const {
  auto *var = exec_scope_->FindVar(name);
  CHECK(var) << "no variable named " << name << " in exec_scope";
  return &var->Get<lite::Tensor>();
}

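// Like GetTensor(), but returns a mutable tensor so callers can modify it.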
lite::Tensor *Predictor::GetMutableTensor(const std::string &name) {
  auto *var = exec_scope_->FindVar(name);
  CHECK(var) << "no variable named " << name << " in exec_scope";
  return var->GetMutable<lite::Tensor>();
}

// get input by name
lite::Tensor *Predictor::GetInputByName(const std::string &name) {
  auto element = std::find(input_names_.begin(), input_names_.end(), name);
  if (element == input_names_.end()) {
    LOG(ERROR) << "Model does not have an input named [" << name
               << "]; the model's inputs include:";
    for (size_t i = 0; i < input_names_.size(); i++) {
      LOG(ERROR) << "[" << input_names_[i] << "]";
    }
    return nullptr;
  } else {
    int position = std::distance(input_names_.begin(), element);
    return GetInput(position);
  }
}

// #ifdef LITE_WITH_TRAIN
// void Predictor::FeedVars(const std::vector<framework::Tensor> &tensors) {
//   auto var = scope_->FindVar("feed");
//   auto &feed_list = *(var->GetMutable<std::vector<lite::Tensor>>());
//   feed_list.resize(tensors.size());

//   for (size_t i = 0; i < tensors.size(); ++i)
//     feed_list[i].ShareDataWith(tensors[i]);
// }
// #endif

}  // namespace lite
}  // namespace paddle