load_op.cc 5.6 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
D
dzhwinter 已提交
14
#include <fstream>
D
dzhwinter 已提交
15
#include <memory>
Y
Yu Yang 已提交
16

K
Kexin Zhao 已提交
17
#include "paddle/fluid/framework/data_type_transform.h"
Y
Yi Wang 已提交
18 19
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/platform/device_context.h"
20
#include "paddle/fluid/platform/profiler.h"
Y
Yu Yang 已提交
21 22 23 24 25 26 27 28 29 30

namespace paddle {
namespace operators {

class LoadOp : public framework::OperatorBase {
 public:
  LoadOp(const std::string &type, const framework::VariableNameMap &inputs,
         const framework::VariableNameMap &outputs,
         const framework::AttributeMap &attrs)
      : OperatorBase(type, inputs, outputs, attrs) {}
31 32 33 34

 private:
  void RunImpl(const framework::Scope &scope,
               const platform::Place &place) const override {
T
tangwei12 已提交
35 36
    // FIXME(yuyang18): We save variable to local file now, but we should change
    // it to save an output stream.
Y
Yu Yang 已提交
37
    auto filename = Attr<std::string>("file_path");
D
dzhwinter 已提交
38 39 40 41 42 43 44 45 46
    auto format = Attr<std::string>("format");
    std::unique_ptr<std::ifstream> fin;
    if (format == "windows") {
      fin.reset(new std::ifstream(filename,
                                  std::ios_base::in | std::ios_base::binary));
    } else {
      fin.reset(new std::ifstream(filename));
    }
    PADDLE_ENFORCE(static_cast<bool>(*fin), "Cannot open file %s for load op",
Y
Yu Yang 已提交
47 48 49 50 51 52 53
                   filename);

    auto out_var_name = Output("Out");
    auto *out_var = scope.FindVar(out_var_name);
    PADDLE_ENFORCE(out_var != nullptr, "Output variable %s cannot be found",
                   out_var_name);

T
tangwei12 已提交
54
    if (out_var->IsType<framework::LoDTensor>()) {
D
dzhwinter 已提交
55
      LoadLodTensor(*fin, place, out_var);
T
tangwei12 已提交
56
    } else if (out_var->IsType<framework::SelectedRows>()) {
D
dzhwinter 已提交
57
      LoadSelectedRows(*fin, place, out_var);
T
tangwei12 已提交
58 59 60 61
    } else {
      PADDLE_ENFORCE(
          false,
          "Load only support LoDTensor and SelectedRows, %s has wrong type",
T
tangwei12 已提交
62
          out_var_name);
T
tangwei12 已提交
63
    }
T
tangwei12 已提交
64
  }
T
tangwei12 已提交
65

T
tangwei12 已提交
66
  void LoadLodTensor(std::istream &fin, const platform::Place &place,
T
tangwei12 已提交
67 68 69 70
                     framework::Variable *var) const {
    // get device context from pool
    platform::DeviceContextPool &pool = platform::DeviceContextPool::Instance();
    auto &dev_ctx = *pool.Get(place);
T
tangwei12 已提交
71
    auto *tensor = var->GetMutable<framework::LoDTensor>();
T
tangwei12 已提交
72
    DeserializeFromStream(fin, tensor, dev_ctx);
K
Kexin Zhao 已提交
73 74 75 76 77 78 79 80 81 82

    auto load_as_fp16 = Attr<bool>("load_as_fp16");
    auto in_dtype = framework::ToDataType(tensor->type());
    auto out_dtype = load_as_fp16 ? framework::proto::VarType::FP16 : in_dtype;

    if (in_dtype != out_dtype) {
      // convert to float16 tensor
      auto in_kernel_type = framework::OpKernelType(in_dtype, place);
      auto out_kernel_type = framework::OpKernelType(out_dtype, place);
      framework::LoDTensor fp16_tensor;
K
Kexin Zhao 已提交
83 84
      // copy LoD info to the new tensor
      fp16_tensor.set_lod(tensor->lod());
K
Kexin Zhao 已提交
85 86
      framework::TransDataType(in_kernel_type, out_kernel_type, *tensor,
                               &fp16_tensor);
K
Kexin Zhao 已提交
87

K
Kexin Zhao 已提交
88
      // reset output tensor
T
tangwei12 已提交
89 90
      var->Clear();
      tensor = var->GetMutable<framework::LoDTensor>();
K
Kexin Zhao 已提交
91 92
      tensor->set_lod(fp16_tensor.lod());
      tensor->ShareDataWith(fp16_tensor);
T
tangwei12 已提交
93
    }
T
tangwei12 已提交
94 95
  }

T
tangwei12 已提交
96
  void LoadSelectedRows(std::istream &fin, const platform::Place &place,
T
tangwei12 已提交
97
                        framework::Variable *var) const {
T
tangwei12 已提交
98
    auto *selectedRows = var->GetMutable<framework::SelectedRows>();
T
tangwei12 已提交
99 100 101 102
    // get device context from pool
    platform::DeviceContextPool &pool = platform::DeviceContextPool::Instance();
    auto &dev_ctx = *pool.Get(place);
    framework::DeserializeFromStream(fin, selectedRows, dev_ctx);
T
tangwei12 已提交
103
    selectedRows->SyncIndex();
Y
Yu Yang 已提交
104 105 106 107 108
  }
};

// Declares the output, the attributes (with defaults and validity checkers)
// and the user-facing documentation of the load operator.
class LoadOpProtoMaker : public framework::OpProtoAndCheckerMaker {
 public:
  void Make() override {
    AddOutput("Out", "The LoDTensor / SelectedRows need to be loaded");
    AddAttr<bool>(
        "load_as_fp16",
        "If true, the tensor will be first loaded and then "
        "converted to float16 data type. Otherwise, the tensor will be "
        "directly loaded without data type conversion. Default is false.")
        .SetDefault(false);
    // An empty path is rejected by the checker.
    AddAttr<std::string>("file_path",
                         R"(Variable will be loaded from "file_path")")
        .AddCustomChecker(
            [](const std::string &path) { return !path.empty(); });
    // Only the two literal values "windows" and "linux" are accepted.
    AddAttr<std::string>("format",
                         R"DOC((windows|linux) Format of the saved model file.
Windows and Linux use different newline symbols: Windows uses \r\n and Linux
uses \n. If format is set to windows, the file is opened in binary mode, which
works on both Linux and Windows. If format is set to linux, the file is opened
in the default (text) mode. Note that these two formats are not
inter-compatible.)DOC")
        .SetDefault("linux")
        .AddCustomChecker([](const std::string &s) {
          return s == "windows" || s == "linux";
        });
    AddComment(
        "Load operator will load a LoDTensor / SelectedRows variable from disk "
        "file.");
  }
};
}  // namespace operators
}  // namespace paddle
// Short alias for the operator namespace, used by the registration below.
namespace ops = paddle::operators;

// Registers the `load` operator, passing LoadOp and LoadOpProtoMaker to the
// registration macro.
REGISTER_OPERATOR(load, ops::LoadOp, ops::LoadOpProtoMaker);