load_op.cc 5.4 KB
Newer Older
1
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.
Y
Yu Yang 已提交
2

L
Luo Tao 已提交
3 4 5
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
Y
Yu Yang 已提交
6

L
Luo Tao 已提交
7
    http://www.apache.org/licenses/LICENSE-2.0
Y
Yu Yang 已提交
8

L
Luo Tao 已提交
9 10 11 12 13
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */
D
dzhwinter 已提交
14
#include <fstream>
Y
Yu Yang 已提交
15

K
Kexin Zhao 已提交
16
#include "paddle/fluid/framework/data_type_transform.h"
Y
Yi Wang 已提交
17 18
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/platform/device_context.h"
19
#include "paddle/fluid/platform/profiler.h"
Y
Yu Yang 已提交
20 21 22 23

namespace paddle {
namespace operators {

24
class LoadOp : public framework::OperatorWithKernel {
Y
Yu Yang 已提交
25
 public:
26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63
  using framework::OperatorWithKernel::OperatorWithKernel;

  void InferShape(framework::InferShapeContext *ctx) const override {}

 protected:
  framework::OpKernelType GetExpectedKernelType(
      const framework::ExecutionContext &ctx) const override {
    framework::OpKernelType kt = framework::OpKernelType(
        framework::proto::VarType::FP32, platform::CPUPlace());
    return kt;
  }
};

// Declares the interface of the `load` operator: one output ("Out") and two
// attributes ("load_as_fp16" and "file_path").
class LoadOpProtoMaker : public framework::OpProtoAndCheckerMaker {
 public:
  void Make() override {
    // Checker attached to "file_path": evaluates to true for a non-empty path.
    // NOTE(review): confirm that AddCustomChecker acts on this boolean result.
    const auto path_is_set = [](const std::string &path) {
      return !path.empty();
    };

    AddOutput("Out", "The LoDTensor / SelectedRows need to be loaded");

    AddAttr<bool>("load_as_fp16",
                  "If true, the tensor will be first loaded and then converted "
                  "to float16 data type. Otherwise, the tensor will be directly "
                  "loaded without data type conversion. Default is false.")
        .SetDefault(false);

    AddAttr<std::string>("file_path",
                         "Variable will be loaded from \"file_path\"")
        .AddCustomChecker(path_is_set);

    AddComment(
        "Load operator will load a LoDTensor / SelectedRows variable from "
        "disk file.");
  }
};

// Kernel for the `load` operator. It opens the file named by the "file_path"
// attribute and deserializes its content into the "Out" variable, which must
// hold either a LoDTensor or a SelectedRows.
template <typename DeviceContext, typename T>
class LoadOpKernel : public framework::OpKernel<T> {
 public:
  // Opens the input file, validates the output variable and dispatches on the
  // type held by that variable. Every failure is reported via PADDLE_ENFORCE.
  void Compute(const framework::ExecutionContext &ctx) const override {
    auto place = ctx.GetPlace();
    // FIXME(yuyang18): We save variable to local file now, but we should change
    // it to save an output stream.
    auto filename = ctx.Attr<std::string>("file_path");
    std::ifstream fin(filename, std::ios::binary);
    PADDLE_ENFORCE(static_cast<bool>(fin), "Cannot open file %s for load op",
                   filename);

    // Keep the name itself for diagnostics. Calling `.data()` on the name list
    // would hand the "%s" placeholders a pointer instead of the name. An empty
    // list falls back to an empty name so the lookup below still reports.
    const auto &out_names = ctx.Outputs("Out");
    const std::string out_var_name =
        out_names.empty() ? std::string() : out_names.front();
    auto *out_var = ctx.OutputVar("Out");

    PADDLE_ENFORCE(out_var != nullptr, "Output variable %s cannot be found ",
                   out_var_name);

    if (out_var->IsType<framework::LoDTensor>()) {
      LoadLodTensor(fin, place, out_var, ctx);
    } else if (out_var->IsType<framework::SelectedRows>()) {
      LoadSelectedRows(fin, place, out_var);
    } else {
      PADDLE_ENFORCE(
          false,
          "Load only support LoDTensor and SelectedRows, %s has wrong type",
          out_var_name);
    }
  }

  // Deserializes a LoDTensor from `fin` into `var`. When the "load_as_fp16"
  // attribute is true and the loaded dtype differs from FP16, the data is
  // converted and `var` is reset to hold the converted tensor.
  void LoadLodTensor(std::istream &fin, const platform::Place &place,
                     framework::Variable *var,
                     const framework::ExecutionContext &ctx) const {
    // get device context from pool
    platform::DeviceContextPool &pool = platform::DeviceContextPool::Instance();
    auto &dev_ctx = *pool.Get(place);
    auto *tensor = var->GetMutable<framework::LoDTensor>();
    // Qualified the same way as the SelectedRows overload used below.
    framework::DeserializeFromStream(fin, tensor, dev_ctx);

    auto load_as_fp16 = ctx.Attr<bool>("load_as_fp16");
    auto in_dtype = tensor->type();
    auto out_dtype = load_as_fp16 ? framework::proto::VarType::FP16 : in_dtype;

    if (in_dtype != out_dtype) {
      // convert to float16 tensor
      auto in_kernel_type = framework::OpKernelType(in_dtype, place);
      auto out_kernel_type = framework::OpKernelType(out_dtype, place);
      framework::LoDTensor fp16_tensor;
      // copy LoD info to the new tensor
      fp16_tensor.set_lod(tensor->lod());
      framework::TransDataType(in_kernel_type, out_kernel_type, *tensor,
                               &fp16_tensor);

      // reset output tensor
      var->Clear();
      tensor = var->GetMutable<framework::LoDTensor>();
      tensor->set_lod(fp16_tensor.lod());
      tensor->ShareDataWith(fp16_tensor);
    }
  }

  // Deserializes a SelectedRows from `fin` into `var`, then calls SyncIndex()
  // on the loaded object.
  void LoadSelectedRows(std::istream &fin, const platform::Place &place,
                        framework::Variable *var) const {
    auto *selectedRows = var->GetMutable<framework::SelectedRows>();
    // get device context from pool
    platform::DeviceContextPool &pool = platform::DeviceContextPool::Instance();
    auto &dev_ctx = *pool.Get(place);
    framework::DeserializeFromStream(fin, selectedRows, dev_ctx);
    selectedRows->SyncIndex();
  }
};

}  // namespace operators
}  // namespace paddle
// Short alias for the namespace that holds the operator classes of this file.
namespace ops = paddle::operators;

// Hands the `load` name, its operator class and its proto maker to the
// REGISTER_OPERATOR macro.
REGISTER_OPERATOR(load, ops::LoadOp, ops::LoadOpProtoMaker);
138 139 140 141 142 143

// Hands LoadOpKernel instantiations for float, double, int and int64_t (all on
// CPUDeviceContext) to REGISTER_OP_CPU_KERNEL under the `load` name.
REGISTER_OP_CPU_KERNEL(
    load, ops::LoadOpKernel<paddle::platform::CPUDeviceContext, float>,
    ops::LoadOpKernel<paddle::platform::CPUDeviceContext, double>,
    ops::LoadOpKernel<paddle::platform::CPUDeviceContext, int>,
    ops::LoadOpKernel<paddle::platform::CPUDeviceContext, int64_t>);