ir_graph_build_pass.cc 5.1 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/inference/analysis/passes/ir_graph_build_pass.h"
16

17
#include <memory>
18
#include <string>
19

20
#include "paddle/fluid/framework/executor.h"
21
#include "paddle/fluid/framework/ir/fuse_pass_base.h"
22 23 24 25 26 27 28 29 30 31 32 33 34 35
#include "paddle/fluid/inference/io.h"
#include "paddle/fluid/platform/enforce.h"

namespace paddle {
namespace inference {

// Declaration only; the definition lives outside this file.
// NOTE(review): presumably reads the file at `filename` into `*contents` --
// confirm against the definition. It is not referenced by the code visible in
// this file.
extern void ReadBinaryFile(const std::string &filename, std::string *contents);

namespace analysis {

// Builds the main program and main graph of `argument`.
//
// Steps:
//   1. Install a fresh framework::Scope if `argument` has no valid scope.
//   2. Require that the `use_gpu` field is set and the scope pointer is
//      non-null.
//   3. Load the program through LoadModel(), either from `model_dir` or from
//      the (model_program_path, model_params_path) pair, and store it as the
//      main program.
//   4. Wrap the main program in a Graph, store it as the main graph, and
//      register the scope on the graph under framework::ir::kParamScopeAttr.
//   5. When compiled with PADDLE_WITH_IPU and `use_ipu` is present and true,
//      register the IPU-related fields of `argument` on the graph.
//
// Fails with a PreconditionNotMet error if `use_gpu` is not set, if the scope
// pointer is null, or if neither model source is configured.
void IrGraphBuildPass::RunImpl(Argument *argument) {
  if (!argument->scope_valid()) {
    argument->SetScope(new framework::Scope);
  }
  PADDLE_ENFORCE_EQ(argument->use_gpu_valid(),
                    true,
                    platform::errors::PreconditionNotMet(
                        "The use_gpu field should be valid"));

  // Validate the scope before its first use: it is handed to LoadModel()
  // below, so checking it only afterwards would come too late.
  auto *scope_ptr = argument->scope_ptr();
  PADDLE_ENFORCE_NOT_NULL(scope_ptr,
                          platform::errors::PreconditionNotMet(
                              "The scope ptr should not be nullptr."));

  // The load program should run on the same device as the inference program,
  // so that the parameters end up on that device; otherwise they would keep
  // being copied between different devices.
  // NOTE(review): the place is always CPUPlace here, independent of use_gpu --
  // confirm this is intended.
  const platform::Place place = platform::CPUPlace();

  if (argument->model_dir_valid()) {
    auto program = LoadModel(argument->model_dir(), scope_ptr, place);
    argument->SetMainProgram(program.release());
  } else if (argument->model_program_path_valid() &&
             argument->model_params_path_valid()) {
    auto program = LoadModel(
        argument->model_program_path(),
        argument->model_params_path(),
        scope_ptr,
        place,
        argument->model_from_memory_valid() && argument->model_from_memory(),
        argument->skip_load_params());
    argument->SetMainProgram(program.release());
  } else {
    PADDLE_THROW(platform::errors::PreconditionNotMet(
        "either model_dir or (program path and parameter path) should be "
        "set."));
  }

  auto graph = std::unique_ptr<Graph>(new Graph(argument->main_program()));
  argument->SetMainGraph(graph.release());
  argument->main_graph().SetNotOwned(framework::ir::kParamScopeAttr, scope_ptr);

// ipu related
#ifdef PADDLE_WITH_IPU
  if (argument->Has("use_ipu") && argument->use_ipu()) {
    argument->main_graph().SetNotOwned("num_ipus",
                                       &argument->ipu_device_num());
    argument->main_graph().SetNotOwned("micro_batch_size",
                                       &argument->ipu_micro_batch_size());
    argument->main_graph().SetNotOwned("enable_pipelining",
                                       &argument->ipu_enable_pipelining());
    argument->main_graph().SetNotOwned("batches_per_step",
                                       &argument->ipu_batches_per_step());
    argument->main_graph().SetNotOwned("enable_fp16",
                                       &argument->ipu_enable_fp16());
    argument->main_graph().SetNotOwned("replica_num",
                                       &argument->ipu_replica_num());
    argument->main_graph().SetNotOwned(
        "available_memory_proportion",
        &argument->ipu_available_memory_proportion());
    argument->main_graph().SetNotOwned("enable_half_partial",
                                       &argument->ipu_enable_half_partial());
    argument->main_graph().SetNotOwned("custom_ops_info",
                                       &argument->ipu_custom_ops_info());
    argument->main_graph().SetNotOwned("custom_patterns",
                                       &argument->ipu_custom_patterns());
  }
#endif
}

std::unique_ptr<framework::ProgramDesc> IrGraphBuildPass::LoadModel(
106 107
    const std::string &path,
    framework::Scope *scope,
S
superjomn 已提交
108
    const platform::Place &place) {
109 110 111 112 113
  framework::Executor exe(place);
  return Load(&exe, scope, path);
}

std::unique_ptr<framework::ProgramDesc> IrGraphBuildPass::LoadModel(
114 115 116 117
    const std::string &program_path,
    const std::string &params_path,
    framework::Scope *scope,
    const platform::Place &place,
118 119
    bool model_from_memory,
    bool skip_load_params) {
120
  framework::Executor exe(place);
T
Tao Luo 已提交
121
  if (!model_from_memory) {
122
    return Load(&exe, scope, program_path, params_path, !skip_load_params);
T
Tao Luo 已提交
123 124 125
  } else {
    return LoadFromMemory(&exe, scope, program_path, params_path);
  }
126 127 128 129 130 131 132
}

// Returns the constant textual representation of this pass.
std::string IrGraphBuildPass::repr() const {
  return std::string("ir-graph-build-pass");
}

}  // namespace analysis
}  // namespace inference
}  // namespace paddle