/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#include "paddle/fluid/operators/reshape_op.h"
Y
Yibing Liu 已提交
16 17 18 19 20 21 22 23 24 25 26

namespace paddle {
namespace operators {

class ReshapeOp : public framework::OperatorWithKernel {
 public:
  ReshapeOp(const std::string &type, const framework::VariableNameMap &inputs,
            const framework::VariableNameMap &outputs,
            const framework::AttributeMap &attrs)
      : OperatorWithKernel(type, inputs, outputs, attrs) {}

27
  void InferShape(framework::InferShapeContext *ctx) const override {
Q
Qiao Longfei 已提交
28 29 30 31
    PADDLE_ENFORCE(ctx->HasInput("X"),
                   "Input(X) of ReshapeOp should not be null.");
    PADDLE_ENFORCE(ctx->HasOutput("Out"),
                   "Output(Out) of ReshapeOp should not be null.");
32

Y
ying 已提交
33
    const std::vector<int> &shape = ctx->Attrs().Get<std::vector<int>>("shape");
C
caoying03 已提交
34 35
    PADDLE_ENFORCE(!shape.empty(),
                   "The shape information must be set by Attr(shape).");
Y
ying 已提交
36

C
caoying03 已提交
37
    std::vector<int64_t> output_shape;
Q
Qiao Longfei 已提交
38
    auto x_dims = ctx->GetInputDim("X");
C
caoying03 已提交
39
    bool need_copy_dim = ValidateShape(shape, x_dims, output_shape);
40

C
caoying03 已提交
41 42 43
    if (need_copy_dim) {
      // Some dimensions can only be determined during runtime. Here temporarily
      // set output tensor's shape the same as that of the input tensor.
Y
ying 已提交
44 45
      ctx->SetOutputDim("Out", x_dims);
    } else {
C
caoying03 已提交
46
      ctx->SetOutputDim("Out", framework::make_ddim(output_shape));
D
Fix bug  
dangqingqing 已提交
47
    }
C
caoying03 已提交
48 49 50 51 52 53 54 55

    // NOTE: Reshape op cannot reshape an input sequence batch into an output
    // sequence batch that has a different number of time steps.
    // Here output always shares the LoD information with input. But if
    // Attr(shape) contains 0 or -1, the actual output shape can only be
    // determined during runtime. The check for wheather it is a valid output
    // sequence batch is performed in runtime.
    ctx->ShareLoD("X", /*->*/ "Out");
Y
Yibing Liu 已提交
56
  }
Y
ying 已提交
57 58

 private:
C
caoying03 已提交
59 60
  bool ValidateShape(const std::vector<int> &shape,
                     const framework::DDim &input_dim,
Y
ying 已提交
61
                     std::vector<int64_t> &output_shape) const {
C
caoying03 已提交
62
    // only one dimension can be set to -1, whose size will be automatically
C
caoying03 已提交
63 64 65 66
    // infered.
    const int64_t unknown_index = -1;
    const auto in_size = framework::product(input_dim);
    const auto x_rank = input_dim.size();
Y
ying 已提交
67

C
caoying03 已提交
68 69
    bool need_dim_copy = false;
    std::vector<size_t> neg_dims_idx;
Y
ying 已提交
70
    for (size_t i = 0; i < shape.size(); ++i) {
C
caoying03 已提交
71
      PADDLE_ENFORCE(shape[i] >= 0 || shape[i] == unknown_index,
Y
ying 已提交
72 73
                     "Each input dimension of Attr(shape) must be positive, or "
                     "only one input dimension can be -1.");
C
caoying03 已提交
74 75 76 77 78 79 80 81
      if (shape[i] == unknown_index) {
        neg_dims_idx.push_back(i);
      } else if (shape[i] == 0) {
        PADDLE_ENFORCE_LT(
            i, x_rank,
            "Only dimension less than rank of Input(X) can be set to 0.");
        need_dim_copy = true;
      }
Y
ying 已提交
82 83 84
    }
    PADDLE_ENFORCE_LE(
        neg_dims_idx.size(), 1,
C
caoying03 已提交
85
        "Only one input dimension of Attr(shape) can be unknown.");
Y
ying 已提交
86

C
caoying03 已提交
87 88 89 90 91 92 93
    output_shape.resize(shape.size(), 0);
    std::transform(shape.begin(), shape.end(), output_shape.begin(),
                   [](int a) { return static_cast<int64_t>(a); });

    // some dimension can only be determinted during runtime.
    if (need_dim_copy) return need_dim_copy;

Y
ying 已提交
94 95 96 97 98
    int64_t inferred_dim = 0;
    if (neg_dims_idx.size()) {
      int64_t capacity = std::accumulate(shape.begin(), shape.end(), 1,
                                         std::multiplies<int>());
      inferred_dim = in_size / (-capacity);
C
caoying03 已提交
99 100 101
      PADDLE_ENFORCE_EQ(inferred_dim * (-capacity), in_size,
                        "Invalid shape is given.");
      output_shape[neg_dims_idx[0]] = inferred_dim;
Y
ying 已提交
102
    }
C
caoying03 已提交
103
    return false;
C
caoying03 已提交
104
  }
Y
Yibing Liu 已提交
105 106 107 108
};

// Declares the proto of the reshape operator: one input ("X"), one output
// ("Out"), the attributes "shape" and "inplace", and the operator comment.
class ReshapeOpMaker : public framework::OpProtoAndCheckerMaker {
 public:
  ReshapeOpMaker(OpProto *proto, OpAttrChecker *op_checker)
      : OpProtoAndCheckerMaker(proto, op_checker) {
    // Tensors.
    AddInput("X", "The input tensor of reshape operator.");
    AddOutput("Out", "The output tensor of reshape operator.");

    // Attributes. "inplace" defaults to false.
    AddAttr<std::vector<int>>(
        "shape", "(std::vector<int>) Target shape of reshape operator.");
    AddAttr<bool>(
        "inplace",
        "(default: false) Change the source tensor's shape without memory "
        "copy. When Attr(inplace) is set true, the output tensor shares "
        "memory with Input(X), otherwise, a new output tensor is created, "
        "and its data are copied from Input(x).")
        .SetDefault(false);

    // Operator comment text.
    AddComment(R"DOC(
Reshape Operator.

Reshape Input(X) into the shape specified by Attr(shape). The data in Input(X)
are unchanged.

Examples:

1. Given a 3-D tensor Input(X) with a shape [2, 4, 6], and the target shape
specified by Attr(shape) is [6, 8], the reshape operator will transform Input(X)
into a 2-D tensor with shape [6, 8] and leaving Input(X)'s data unchanged.

1. Given a 3-D tensor Input(X) with a shape [2, 4, 6], and the target shape
specified by Attr(shape) is [2, 3, -1, 2], the reshape operator will transform
Input(X) into a 4-D tensor with shape [2, 3, 4, 2] and leaving Input(X)'s data
unchanged. In this case, one and only dimension of Attr(shape) can be set to -1,
the value of this dimension is inferred from the total element number of
Input(X) and remaining dimensions.

1. Given a 3-D tensor Input(X) with a shape [2, 4, 6], and the target shape
specified by Attr(shape) is [-1, 0, 3, 2], the reshape operator will transform
Input(X) into a 4-D tensor with shape [2, 4, 3, 2] and leaving Input(X)'s data
unchanged. In this case, besides -1, 0 means the actual dimension value is going
to be copied from the corresponding dimension of Input(X).

Note:

1. One and only one dimension in Attr(shape) can be set -1. In this case,
the actual dimension value will be infered from the total element number of
Input(X) and remaining dimensions.
1. More than one dimensions in Attr(shape) can be set to 0, which means the real
dimension value will be copied from Input(X) at runtime. Note that the index of
0 can not access Rank(X). For example, Input(X) is a 3-D tensor with shape
[2, 3, 4], Attr(shape) = [2, 3, 2, 0] is an invalid input.

)DOC");
  }
};

class ReshapeGradOp : public framework::OperatorWithKernel {
 public:
  ReshapeGradOp(const std::string &type,
                const framework::VariableNameMap &inputs,
                const framework::VariableNameMap &outputs,
                const framework::AttributeMap &attrs)
      : OperatorWithKernel(type, inputs, outputs, attrs) {}

168
  void InferShape(framework::InferShapeContext *ctx) const override {
Q
Qiao Longfei 已提交
169 170 171 172
    PADDLE_ENFORCE(ctx->HasInput("X"), "Input(X) shouldn't be null.");
    PADDLE_ENFORCE(ctx->HasInput(framework::GradVarName("Out")),
                   "Input(Out@GRAD) shouldn't be null.");
    ctx->SetOutputDim(framework::GradVarName("X"), ctx->GetInputDim("X"));
Y
Yibing Liu 已提交
173 174 175 176 177 178
  }
};

}  // namespace operators
}  // namespace paddle
namespace ops = paddle::operators;
179
using CPU = paddle::platform::CPUDeviceContext;
Y
Yibing Liu 已提交
180 181 182

REGISTER_OP(reshape, ops::ReshapeOp, ops::ReshapeOpMaker, reshape_grad,
            ops::ReshapeGradOp);
183 184 185 186 187 188 189 190
REGISTER_OP_CPU_KERNEL(reshape, ops::ReshapeKernel<CPU, float>,
                       ops::ReshapeKernel<CPU, double>,
                       ops::ReshapeKernel<CPU, int>,
                       ops::ReshapeKernel<CPU, int64_t>);
REGISTER_OP_CPU_KERNEL(reshape_grad, ops::ReshapeGradKernel<CPU, float>,
                       ops::ReshapeGradKernel<CPU, double>,
                       ops::ReshapeGradKernel<CPU, int>,
                       ops::ReshapeGradKernel<CPU, int64_t>);