/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #pragma once #include // for max #include #include #include #include #include "paddle/fluid/framework/data_layout.h" #include "paddle/fluid/framework/op_registry.h" #include "paddle/fluid/framework/operator.h" #include "paddle/fluid/operators/elementwise/elementwise_op_function.h" #ifdef PADDLE_WITH_MKLDNN #include "paddle/fluid/platform/mkldnn_helper.h" #endif namespace paddle { namespace operators { class ElementwiseOp : public framework::OperatorWithKernel { public: using framework::OperatorWithKernel::OperatorWithKernel; using Tensor = framework::Tensor; void InferShape(framework::InferShapeContext *ctx) const override { PADDLE_ENFORCE_EQ(ctx->HasInput("X"), true, "Input(X) of elementwise op should not be null."); PADDLE_ENFORCE_EQ(ctx->HasInput("Y"), true, "Input(Y) of elementwise op should not be null."); PADDLE_ENFORCE_EQ(ctx->HasOutput("Out"), true, "Output(Out) of elementwise op should not be null."); PADDLE_ENFORCE( ctx->GetInputsVarType("Y").front() == framework::proto::VarType::LOD_TENSOR, "The input var's type should be LoDTensor, but the received is %s [%s]", ctx->GetInputsVarType("Y").front(), ctx->Inputs("Y").front()); if (ctx->GetInputsVarType("X").front() == framework::proto::VarType::SELECTED_ROWS) { PADDLE_ENFORCE_EQ( ctx->GetInputDim("Y").size(), 1u, "ShapeError: For elementwise_op, if X is Sparse(VarType.SELECTED_ROWS" "), Y must be scalar. But reveived the dimension of Y = %s", ctx->GetInputDim("Y").size()); PADDLE_ENFORCE_EQ( ctx->GetInputDim("Y")[0], 1, "ShapeError: For elementwise_op, if X is Sparse(VarType.SELECTED_ROWS" "), Y must be scalar. But reveived the first dimension of Y = %s", ctx->GetInputDim("Y")[0]); } else if (ctx->GetInputsVarType("X").front() != framework::proto::VarType::LOD_TENSOR) { PADDLE_THROW("X's type[%s] is not supported by elementwise_op.", ctx->GetInputsVarType("X").front()); } if (ctx->GetInputDim("X") == ctx->GetInputDim("Y")) { ctx->ShareDim("X", /*->*/ "Out"); ctx->ShareLoD("X", /*->*/ "Out"); } else { auto x_dims = ctx->GetInputDim("X"); auto y_dims = ctx->GetInputDim("Y"); int max_dim = std::max(x_dims.size(), y_dims.size()); int axis = ctx->Attrs().Get("axis"); axis = (axis == -1 ? std::abs(x_dims.size() - y_dims.size()) : axis); std::vector x_dims_array(max_dim); std::vector y_dims_array(max_dim); std::vector out_dims_array(max_dim); GetBroadcastDimsArrays(x_dims, y_dims, x_dims_array.data(), y_dims_array.data(), out_dims_array.data(), max_dim, axis); ctx->SetOutputDim("Out", framework::make_ddim(out_dims_array)); // to do ctx->ShareLoD("X", /*->*/ "Out"); } } framework::OpKernelType GetExpectedKernelType( const framework::ExecutionContext &ctx) const override { auto input_data_type = OperatorWithKernel::IndicateVarDataType(ctx, "X"); #ifdef PADDLE_WITH_MKLDNN // If broadcasting is needed, use native implementation auto CanMKLDNNElementwiseAddBeUsed = [&]() { return ctx.Input("X")->dims() == ctx.Input("Y")->dims(); }; if (platform::CanMKLDNNBeUsed(ctx) && (ctx.Type() != "elementwise_add" || CanMKLDNNElementwiseAddBeUsed())) { return framework::OpKernelType(input_data_type, ctx.GetPlace(), framework::DataLayout::kMKLDNN, framework::LibraryType::kMKLDNN); } #endif return framework::OpKernelType(input_data_type, ctx.GetPlace()); } }; class ElementwiseOpInferVarType : public framework::PassInDtypeAndVarTypeToOutput { protected: std::unordered_map GetInputOutputWithSameType() const override { return std::unordered_map{{"X", /*->*/ "Out"}}; } }; class ElementwiseOpMaker : public framework::OpProtoAndCheckerMaker { public: void Make() final { AddInputX(); AddInputY(); AddOpOutput(); AddAttr("axis", "(int, default -1). If X.dimension != Y.dimension," "Y.dimension must be a subsequence of x.dimension. And axis " "is the start dimension index " "for broadcasting Y onto X. ") .SetDefault(-1) .EqualGreaterThan(-1); AddAttr("use_mkldnn", "(bool, default false). Used by MKLDNN.") .SetDefault(false); AddAttr("x_data_format", "This parameter is no longer used.") .SetDefault(""); AddAttr("y_data_format", "This parameter is no longer used.") .SetDefault(""); AddOpComment(); } protected: virtual void AddInputX() { AddInput("X", "(Tensor), The first input tensor of elementwise op."); } virtual void AddInputY() { AddInput("Y", "(Tensor), The second input tensor of elementwise op."); } virtual void AddOpOutput() { AddOutput("Out", "N-dimension tensor. A location into which the result is stored. " "It's dimension " "equals with x"); } virtual void AddOpComment() { AddComment(GetCommentExamples()); } virtual std::string GetOpFuntionality() const { return ""; } virtual std::string GetName() const = 0; virtual std::string GetEquation() const = 0; std::string GetCommentExamples() const { return string::Sprintf(R"DOC( Elementwise %s Operator. %s The equation is: $$%s$$ - $X$: a tensor of any dimension. - $Y$: a tensor whose dimensions must be less than or equal to the dimensions of $X$. There are two cases for this operator: 1. The shape of $Y$ is the same with $X$. 2. The shape of $Y$ is a continuous subsequence of $X$. For case 2: 1. Broadcast $Y$ to match the shape of $X$, where $axis$ is the start dimension index for broadcasting $Y$ onto $X$. 2. If $axis$ is -1 (default), $axis = rank(X) - rank(Y)$. 3. The trailing dimensions of size 1 for $Y$ will be ignored for the consideration of subsequence, such as shape(Y) = (2, 1) => (2). For example: .. code-block:: text shape(X) = (2, 3, 4, 5), shape(Y) = (,) shape(X) = (2, 3, 4, 5), shape(Y) = (5,) shape(X) = (2, 3, 4, 5), shape(Y) = (4, 5), with axis=-1(default) or axis=2 shape(X) = (2, 3, 4, 5), shape(Y) = (3, 4), with axis=1 shape(X) = (2, 3, 4, 5), shape(Y) = (2), with axis=0 shape(X) = (2, 3, 4, 5), shape(Y) = (2, 1), with axis=0 )DOC", GetName(), GetOpFuntionality(), GetEquation()); } }; class ElementwiseOpGrad : public framework::OperatorWithKernel { public: using framework::OperatorWithKernel::OperatorWithKernel; using Tensor = framework::Tensor; void InferShape(framework::InferShapeContext *ctx) const override { auto out_grad_name = framework::GradVarName("Out"); PADDLE_ENFORCE_EQ(ctx->HasInput("Y"), true, "Input(Y) should not be null."); PADDLE_ENFORCE_EQ(ctx->HasInput(out_grad_name), true, "Input(Out@GRAD) should not be null."); auto x_grad_name = framework::GradVarName("X"); auto y_grad_name = framework::GradVarName("Y"); if (ctx->HasOutput(x_grad_name)) { ctx->ShareDim("X", /*->*/ x_grad_name); ctx->ShareLoD("X", /*->*/ x_grad_name); } if (ctx->HasOutput(y_grad_name)) { ctx->ShareDim("Y", /*->*/ y_grad_name); ctx->ShareLoD("Y", /*->*/ y_grad_name); } } framework::OpKernelType GetExpectedKernelType( const framework::ExecutionContext &ctx) const override { auto input_data_type = OperatorWithKernel::IndicateVarDataType( ctx, framework::GradVarName("Out")); #ifdef PADDLE_WITH_MKLDNN // If broadcasting is needed, use native implementation auto CanMKLDNNElementwiseAddGradBeUsed = [&]() { auto dx = ctx.Output(framework::GradVarName("X")); auto dy = ctx.Output(framework::GradVarName("Y")); return (dx != nullptr && dy != nullptr && dx->dims() == dy->dims()); }; if (platform::CanMKLDNNBeUsed(ctx) && (ctx.Type() != "elementwise_add_grad" || CanMKLDNNElementwiseAddGradBeUsed())) { return framework::OpKernelType(input_data_type, ctx.GetPlace(), framework::DataLayout::kMKLDNN, framework::LibraryType::kMKLDNN); } #endif return framework::OpKernelType(input_data_type, ctx.GetPlace()); } }; class ElementwiseOpDoubleGrad : public framework::OperatorWithKernel { public: using framework::OperatorWithKernel::OperatorWithKernel; using Tensor = framework::Tensor; void InferShape(framework::InferShapeContext *ctx) const override { auto x_grad_name = framework::GradVarName("X"); auto y_grad_name = framework::GradVarName("Y"); if (ctx->HasOutput(x_grad_name)) { ctx->ShareDim("X", x_grad_name); ctx->ShareLoD("X", x_grad_name); } if (ctx->HasOutput(y_grad_name)) { ctx->ShareDim("Y", y_grad_name); ctx->ShareLoD("Y", y_grad_name); } if (ctx->HasOutput("DDOut")) { ctx->ShareDim("DOut", "DDOut"); ctx->ShareLoD("DOut", "DDOut"); } } framework::OpKernelType GetExpectedKernelType( const framework::ExecutionContext &ctx) const override { auto input_data_type = OperatorWithKernel::IndicateVarDataType(ctx, "DOut"); #ifdef PADDLE_WITH_MKLDNN if (platform::CanMKLDNNBeUsed(ctx)) { return framework::OpKernelType(input_data_type, ctx.GetPlace(), framework::DataLayout::kMKLDNN, framework::LibraryType::kMKLDNN); } #endif return framework::OpKernelType(input_data_type, ctx.GetPlace()); } }; class ElementwiseOpDoubleGradWithoutDXDY : public framework::OperatorWithKernel { public: using framework::OperatorWithKernel::OperatorWithKernel; using Tensor = framework::Tensor; void InferShape(framework::InferShapeContext *ctx) const override { if (ctx->HasOutput("DDOut")) { ctx->ShareDim("DOut", "DDOut"); ctx->ShareLoD("DOut", "DDOut"); } } framework::OpKernelType GetExpectedKernelType( const framework::ExecutionContext &ctx) const override { framework::proto::VarType::Type input_data_type; if (ctx.HasInput("DDX") == false) { PADDLE_ENFORCE_EQ(ctx.HasInput("DDY"), true, "Input(DDY) should not be null"); input_data_type = OperatorWithKernel::IndicateVarDataType(ctx, "DDY"); } else if (ctx.HasInput("DDY") == false) { PADDLE_ENFORCE_EQ(ctx.HasInput("DDX"), true, "Input(DDX) should not be null"); input_data_type = OperatorWithKernel::IndicateVarDataType(ctx, "DDX"); } else { input_data_type = OperatorWithKernel::IndicateVarDataType(ctx, "DDX"); } #ifdef PADDLE_WITH_MKLDNN if (platform::CanMKLDNNBeUsed(ctx)) { return framework::OpKernelType(input_data_type, ctx.GetPlace(), framework::DataLayout::kMKLDNN, framework::LibraryType::kMKLDNN); } #endif return framework::OpKernelType(input_data_type, ctx.GetPlace()); } }; template class ElemwiseGradKernel : public framework::OpKernel { public: void Compute(const framework::ExecutionContext &context) const override { auto *dx = context.Output(framework::GradVarName("X")); if (dx != nullptr) { auto &dout = *context.Input(framework::GradVarName("Out")); dx->set_lod(dout.lod()); } } }; DECLARE_INPLACE_OP_INFERER(ElementwiseOpInplace, {"X", "Out"}); DECLARE_INPLACE_OP_INFERER(ElementwiseGradOpInplace, {framework::GradVarName("Out"), framework::GradVarName("X")}); DECLARE_INPLACE_OP_INFERER(ElementwiseDoubleGradOpInplace, {"DDX", "DDOut"}); DECLARE_NO_NEED_BUFFER_VARS_INFERENCE(ElementwiseGradNoBufVarsInference, "X", "Y"); DECLARE_NO_NEED_BUFFER_VARS_INFERENCE(ElementwiseDoubleGradNoBufVarsInference, "Y", "DOut"); } // namespace operators } // namespace paddle #define REGISTER_ELEMWISE_GRAD_MAKER(kernel_type, op_name) \ template \ class kernel_type##GradMaker \ : public paddle::framework::SingleGradOpMaker { \ public: \ using ::paddle::framework::SingleGradOpMaker::SingleGradOpMaker; \ \ protected: \ void Apply(::paddle::framework::GradOpPtr op) const override { \ op->SetType(#kernel_type "_grad"); \ op->SetInput("X", this->Input("X")); \ op->SetInput("Y", this->Input("Y")); \ op->SetInput(::paddle::framework::GradVarName("Out"), \ this->OutputGrad("Out")); \ op->SetAttrMap(this->Attrs()); \ op->SetOutput(::paddle::framework::GradVarName("X"), \ this->InputGrad("X")); \ op->SetOutput(::paddle::framework::GradVarName("Y"), \ this->InputGrad("Y")); \ } \ } #define REGISTER_ELEMWISE_EXPLICIT_OP_WITHOUT_GRAD(op_type, op_name) \ REGISTER_OPERATOR(op_type, ::paddle::operators::ElementwiseOp, \ ::paddle::operators::Elementwise##op_name##OpMaker, \ ::paddle::operators::ElementwiseOpInferVarType, \ op_type##GradMaker<::paddle::framework::OpDesc>, \ op_type##GradMaker<::paddle::imperative::OpBase>, \ ::paddle::operators::ElementwiseOpInplace);