serializer.cc 4.8 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/jit/serializer.h"

17 18
#include <set>

19 20
#include "paddle/fluid/framework/var_desc.h"
#include "paddle/fluid/framework/variable.h"
21 22
#include "paddle/fluid/platform/device_context.h"

23 24
#include "paddle/fluid/jit/engine/executor_engine.h"
#include "paddle/fluid/jit/engine/pe_engine.h"
25 26
#include "paddle/fluid/jit/layer.h"
#include "paddle/fluid/jit/property.h"
27 28
#include "paddle/fluid/jit/serializer_utils.h"

29 30
DECLARE_string(jit_engine_type);

31 32
namespace paddle {
namespace jit {
33 34
using Name2FunctionInfoMap =
    std::unordered_map<std::string, std::shared_ptr<FunctionInfo>>;
35 36 37
Layer Deserializer::operator()(const std::string& path,
                               const phi::Place& place) {
  const auto& pdmodel_paths = utils::PdmodelFilePaths(path);
38 39
  // set is ordered
  std::set<std::string> param_names_set;
40
  Name2FunctionInfoMap info_map;
41
  for (auto& it : pdmodel_paths) {
42
    auto& func_name = it.first;
43
    auto program_desc = LoadProgram(it.second);
44

45 46
    std::vector<std::string> persist_var_names;
    auto all_var_desc = program_desc.Block(0).AllVars();
47
    for (auto* desc_ptr : all_var_desc) {
48
      if (utils::IsPersistable(desc_ptr)) {
49
        persist_var_names.emplace_back(desc_ptr->Name());
50 51 52
      }
    }

53
    param_names_set.insert(persist_var_names.begin(), persist_var_names.end());
54 55
    info_map[func_name] = std::make_shared<FunctionInfo>(
        func_name, persist_var_names, program_desc);
56 57
  }

58 59
  Name2VariableMap params_dict;
  Name2VariableMap attrs_dict;
60
  ReadTensorData(path + PDPARAMS_SUFFIX, param_names_set, place, &params_dict);
61

62 63 64 65 66
  if (utils::FileExists(path + PROPERTY_SUFFIX)) {
    ReadAttributeData(path + PROPERTY_SUFFIX, &attrs_dict);
    VLOG(3) << "Read Property Success!";
  }

67
  Layer layer = Layer(params_dict, attrs_dict, info_map, place);
68

69 70 71
  for (auto it = info_map.begin(); it != info_map.end(); ++it) {
    const std::string& func_name = it->first;
    auto& info = it->second;
72
    if (FLAGS_jit_engine_type == "Executor") {
73 74 75 76 77
      VLOG(3) << "Add function type: ExecutorEngine. Function name: "
              << func_name;
      layer.SetEngine(
          func_name,
          utils::MakeEngine<ExecutorEngine>(info, params_dict, place));
78
    } else if (FLAGS_jit_engine_type == "PE") {
79 80 81
      VLOG(3) << "Add function type: PEEngine. Function name: " << func_name;
      layer.SetEngine(func_name,
                      utils::MakeEngine<PEEngine>(info, params_dict, place));
82
    } else {
83
      PD_THROW("Invalid JitLayer engine type.");
84
    }
85 86
  }

87
  return layer;
88 89
}

90 91 92
void Deserializer::ReadTensorData(const std::string& file_name,
                                  const std::set<std::string>& var_name,
                                  const phi::Place& place,
93
                                  Name2VariableMap* params_dict) const {
94 95 96
  VLOG(3) << "ReadTensorData from: " << file_name;
  std::ifstream fin(file_name, std::ios::binary);
  platform::DeviceContextPool& pool = platform::DeviceContextPool::Instance();
97
  auto& dev_ctx = *pool.Get(place);
98 99 100 101 102 103
  for (auto it = var_name.begin(); it != var_name.end(); it++) {
    VLOG(3) << "load Tensor: " << *it;
    Variable v;
    // TODO(dev): Support framework::Vocab
    DenseTensor* dense_tesnor = v.GetMutable<DenseTensor>();
    framework::DeserializeFromStream(fin, dense_tesnor, dev_ctx);
104
    (*params_dict)[*it] = std::make_shared<Variable>(v);
105 106 107
  }
}

108
void Deserializer::ReadAttributeData(const std::string& file_path,
109 110 111 112 113 114 115
                                     Name2VariableMap* attrs_dict) const {
  VLOG(3) << "ReadPropertyData from: " << file_path;
  Property p;
  p.Deserialization(file_path);
  *attrs_dict = static_cast<Name2VariableMap>(p.Values());
  return;
}
116

117
framework::ProgramDesc Deserializer::LoadProgram(const std::string& file_name) {
118
  VLOG(3) << "LoadProgram from: " << file_name;
119 120 121 122 123 124 125 126 127
  std::ifstream fin(file_name, std::ios::in | std::ios::binary);
  fin.seekg(0, std::ios::end);
  std::string buffer(fin.tellg(), ' ');
  fin.seekg(0, std::ios::beg);
  fin.read(&buffer[0], buffer.size());
  fin.close();
  return framework::ProgramDesc(buffer);
}

128
Layer Load(const std::string& file_path, const phi::Place& place) {
129
  auto deserializer = Deserializer();
130
  return deserializer(file_path, place);
131 132 133 134
}

}  // namespace jit
}  // namespace paddle