model_optimize_tool.cc 5.0 KB
Newer Older
Y
Yan Chunwei 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18
// Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include <gflags/gflags.h>
#ifdef PADDLE_WITH_TESTING
#include <gtest/gtest.h>
#endif
#include <cstdlib>
#include <string>
#include <vector>
19 20
// "all_kernel_faked.cc" and "kernel_src_map.h" are created automatically during
// model_optimize_tool's compiling period
21
#include "all_kernel_faked.cc"  // NOLINT
22
#include "kernel_src_map.h"     // NOLINT
Y
Yan Chunwei 已提交
23 24 25
#include "lite/api/paddle_api.h"
#include "lite/api/paddle_use_ops.h"
#include "lite/api/paddle_use_passes.h"
26
#include "lite/core/op_registry.h"
Y
Yan Chunwei 已提交
27 28 29
#include "lite/utils/cp_logging.h"
#include "lite/utils/string.h"

30 31 32 33 34 35
// Directory of the input model; forwarded to CxxConfig::set_model_dir() in
// Main(). Main() logs a warning that this flag is ignored when both model_file
// and param_file are non-empty.
DEFINE_string(model_dir,
              "",
              "path of the model. This option will be ignored if model_file "
              "and param_file are exist");
// Model file of a combined-param model; forwarded to
// CxxConfig::set_model_file() in Main().
DEFINE_string(model_file, "", "model file path of the combined-param model");
// Parameter file of a combined-param model; forwarded to
// CxxConfig::set_param_file() in Main().
DEFINE_string(param_file, "", "param file path of the combined-param model");
Y
Yan Chunwei 已提交
36 37 38 39
// Storage format of the saved model. Main() accepts exactly "protobuf" or
// "naive_buffer" and reports a fatal error for any other value.
DEFINE_string(
    optimize_out_type,
    "protobuf",
    "store type of the output optimized model. protobuf/naive_buffer");
40
// When set, Main() logs the kernel registry's debug string and exits with
// status 0 before any model is loaded.
DEFINE_bool(display_kernels, false, "Display kernel information");
41 42 43 44 45
// Passed as the third argument of SaveOptimizedModel() in Main(); when set,
// Main() additionally logs the output path the information was recorded into.
DEFINE_bool(record_tailoring_info,
            false,
            "Record kernels and operators information of the optimized model "
            "for tailoring compiling, information are stored into optimized "
            "model path as hidden files");
Y
Yan Chunwei 已提交
46 47 48 49 50
// Destination path handed to SaveOptimizedModel() in Main().
DEFINE_string(optimize_out, "", "path of the output optimized model");
// Space-separated list of target names. Main() splits this value on " " and
// maps every token (arm, opencl, x86) to one or more Places; any other token
// is reported as a fatal error.
DEFINE_string(valid_targets,
              "arm",
              "The targets this model is optimized for, should be one or more "
              "of (arm, opencl, x86), separated by spaces");
51
// When set, Main() logs a warning and inserts an ARM/int8 Place at the front
// of the valid-places list before configuring the predictor.
DEFINE_bool(prefer_int8_kernel, false, "Prefer to run model with int8 kernels");
Y
Yan Chunwei 已提交
52 53 54 55

namespace paddle {
namespace lite_api {

56 57 58 59 60
//! Logs, at INFO level, the debug string of the global kernel registry.
void DisplayKernels() {
  auto&& kernel_registry = ::paddle::lite::KernelRegistry::Global();
  LOG(INFO) << kernel_registry.DebugString();
}

Y
Yan Chunwei 已提交
61
void Main() {
62 63 64 65 66
  if (!FLAGS_model_file.empty() && !FLAGS_param_file.empty()) {
    LOG(WARNING)
        << "Load combined-param model. Option model_dir will be ignored";
  }

67 68 69 70 71
  if (FLAGS_display_kernels) {
    DisplayKernels();
    exit(0);
  }

Y
Yan Chunwei 已提交
72 73
  lite_api::CxxConfig config;
  config.set_model_dir(FLAGS_model_dir);
74 75
  config.set_model_file(FLAGS_model_file);
  config.set_param_file(FLAGS_param_file);
Y
Yan Chunwei 已提交
76 77 78 79 80 81 82

  std::vector<Place> valid_places;
  auto target_reprs = lite::Split(FLAGS_valid_targets, " ");
  for (auto& target_repr : target_reprs) {
    if (target_repr == "arm") {
      valid_places.emplace_back(TARGET(kARM));
    } else if (target_repr == "opencl") {
83 84 85 86 87 88 89 90 91 92
      valid_places.emplace_back(
          Place{TARGET(kOpenCL), PRECISION(kFP16), DATALAYOUT(kNCHW)});
      valid_places.emplace_back(
          Place{TARGET(kOpenCL), PRECISION(kFP16), DATALAYOUT(kNHWC)});
      valid_places.emplace_back(
          Place{TARGET(kOpenCL), PRECISION(kFloat), DATALAYOUT(kNCHW)});
      valid_places.emplace_back(
          Place{TARGET(kOpenCL), PRECISION(kFloat), DATALAYOUT(kNHWC)});
      valid_places.emplace_back(
          TARGET(kARM));  // enable kARM CPU kernel when no opencl kernel
Y
Yan Chunwei 已提交
93 94 95 96 97 98 99 100 101 102 103 104 105
    } else if (target_repr == "x86") {
      valid_places.emplace_back(TARGET(kX86));
    } else {
      LOG(FATAL) << lite::string_format(
          "Wrong target '%s' found, please check the command flag "
          "'valid_targets'",
          target_repr.c_str());
    }
  }

  CHECK(!valid_places.empty())
      << "At least one target should be set, should set the "
         "command argument 'valid_targets'";
106

107
  if (FLAGS_prefer_int8_kernel) {
Y
Yan Chunwei 已提交
108
    LOG(WARNING) << "Int8 mode is only support by ARM target";
109 110
    valid_places.insert(valid_places.begin(),
                        Place{TARGET(kARM), PRECISION(kInt8)});
Y
Yan Chunwei 已提交
111 112 113 114 115 116 117 118 119 120 121 122 123
  }
  config.set_valid_places(valid_places);

  auto predictor = lite_api::CreatePaddlePredictor(config);

  LiteModelType model_type;
  if (FLAGS_optimize_out_type == "protobuf") {
    model_type = LiteModelType::kProtobuf;
  } else if (FLAGS_optimize_out_type == "naive_buffer") {
    model_type = LiteModelType::kNaiveBuffer;
  } else {
    LOG(FATAL) << "Unsupported Model type :" << FLAGS_optimize_out_type;
  }
124
  OpKernelInfoCollector::Global().SetKernel2path(kernel2path_map);
Y
Yan Chunwei 已提交
125

126 127 128 129 130 131
  predictor->SaveOptimizedModel(
      FLAGS_optimize_out, model_type, FLAGS_record_tailoring_info);
  if (FLAGS_record_tailoring_info) {
    LOG(INFO) << "Record the information of tailored model into :"
              << FLAGS_optimize_out;
  }
Y
Yan Chunwei 已提交
132 133 134 135 136 137 138 139 140 141
}

}  // namespace lite_api
}  // namespace paddle

//! Program entry point: parses the gflags command line, then runs the tool.
int main(int argc, char** argv) {
  // Value passed as the third argument of ParseCommandLineFlags (the
  // remove_flags parameter in gflags' documented signature).
  const bool remove_flags = false;
  google::ParseCommandLineFlags(&argc, &argv, remove_flags);

  paddle::lite_api::Main();
  return 0;
}