ir_graph_build_pass.cc 4.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/inference/analysis/passes/ir_graph_build_pass.h"
16

17
#include <memory>
18
#include <string>
19

20
#include "paddle/fluid/framework/executor.h"
21
#include "paddle/fluid/framework/ir/fuse_pass_base.h"
22 23 24 25 26 27 28 29 30 31 32 33 34 35
#include "paddle/fluid/inference/io.h"
#include "paddle/fluid/platform/enforce.h"

namespace paddle {
namespace inference {

// Forward declaration of a helper defined in another translation unit.
// NOTE(review): presumably reads the file at `filename` into `*contents` --
// confirm against the definition. It is not referenced in the visible part of
// this file.
extern void ReadBinaryFile(const std::string &filename, std::string *contents);

namespace analysis {

// Builds the main program and the main IR graph for `argument`.
//
// Steps, in order:
//   1. Creates a fresh framework::Scope when the argument has none.
//   2. Requires the use_gpu field to be set and the scope pointer to be
//      non-null.
//   3. Loads the program from model_dir, or from the
//      (model_program_path, model_params_path) pair, and stores it as the
//      main program.
//   4. Wraps the main program in a Graph, stores it as the main graph, and
//      attaches the scope (plus the IPU options in PADDLE_WITH_IPU builds) as
//      not-owned graph attributes.
//
// Raises PreconditionNotMet when use_gpu is unset, when the scope pointer is
// null, or when no model location is configured.
void IrGraphBuildPass::RunImpl(Argument *argument) {
  if (!argument->scope_valid()) {
    argument->SetScope(new framework::Scope);
  }
  PADDLE_ENFORCE_EQ(argument->use_gpu_valid(), true,
                    platform::errors::PreconditionNotMet(
                        "The use_gpu field should be valid"));

  // Validate the scope before the loaders receive it, so a null scope is
  // reported as a precondition failure instead of being handed to Load().
  auto *scope_ptr = argument->scope_ptr();
  PADDLE_ENFORCE_NOT_NULL(scope_ptr,
                          platform::errors::PreconditionNotMet(
                              "The scope ptr should not be nullptr."));

  // The load program should run on the same device as the inference program,
  // so that the parameters live on that device; otherwise they would keep
  // being copied between different devices.
  // NOTE(review): the place is currently always CPUPlace, regardless of
  // use_gpu -- confirm this is intended.
  platform::Place place = platform::CPUPlace();

  if (argument->model_dir_valid()) {
    argument->SetMainProgram(
        LoadModel(argument->model_dir(), scope_ptr, place).release());
  } else if (argument->model_program_path_valid() &&
             argument->model_params_path_valid()) {
    // An unset model_from_memory field is treated as "load from files".
    const bool from_memory =
        argument->model_from_memory_valid() && argument->model_from_memory();
    argument->SetMainProgram(LoadModel(argument->model_program_path(),
                                       argument->model_params_path(),
                                       scope_ptr, place, from_memory)
                                 .release());
  } else {
    PADDLE_THROW(platform::errors::PreconditionNotMet(
        "either model_dir or (program path and parameter path) should be "
        "set."));
  }

  // Ownership of the new graph is handed to the argument via release().
  std::unique_ptr<Graph> graph(new Graph(argument->main_program()));
  argument->SetMainGraph(graph.release());

  // Attributes set with SetNotOwned point at objects held by `argument`.
  auto &main_graph = argument->main_graph();
  main_graph.SetNotOwned(framework::ir::kParamScopeAttr, scope_ptr);

// ipu related
#ifdef PADDLE_WITH_IPU
  if (argument->Has("use_ipu") && argument->use_ipu()) {
    main_graph.SetNotOwned("num_ipus", &argument->ipu_device_num());
    main_graph.SetNotOwned("micro_batch_size",
                           &argument->ipu_micro_batch_size());
    main_graph.SetNotOwned("enable_pipelining",
                           &argument->ipu_enable_pipelining());
    main_graph.SetNotOwned("batches_per_step",
                           &argument->ipu_batches_per_step());
    main_graph.SetNotOwned("enable_fp16", &argument->ipu_enable_fp16());
    main_graph.SetNotOwned("replica_num", &argument->ipu_replica_num());
    main_graph.SetNotOwned("available_memory_proportion",
                           &argument->ipu_available_memory_proportion());
    main_graph.SetNotOwned("enable_half_partial",
                           &argument->ipu_enable_half_partial());
  }
#endif
}

std::unique_ptr<framework::ProgramDesc> IrGraphBuildPass::LoadModel(
S
superjomn 已提交
98 99
    const std::string &path, framework::Scope *scope,
    const platform::Place &place) {
100 101 102 103 104 105
  framework::Executor exe(place);
  return Load(&exe, scope, path);
}

std::unique_ptr<framework::ProgramDesc> IrGraphBuildPass::LoadModel(
    const std::string &program_path, const std::string &params_path,
T
Tao Luo 已提交
106
    framework::Scope *scope, const platform::Place &place,
T
Tao Luo 已提交
107
    bool model_from_memory) {
108
  framework::Executor exe(place);
T
Tao Luo 已提交
109 110 111 112 113
  if (!model_from_memory) {
    return Load(&exe, scope, program_path, params_path);
  } else {
    return LoadFromMemory(&exe, scope, program_path, params_path);
  }
114 115 116 117 118 119 120
}

// Returns the fixed textual identifier of this pass.
std::string IrGraphBuildPass::repr() const {
  return "ir-graph-build-pass";
}

}  // namespace analysis
}  // namespace inference
}  // namespace paddle