/* Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. Indicesou may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ #include #include #include #include "paddle/fluid/framework/infershape_utils.h" #include "paddle/fluid/framework/op_registry.h" #include "paddle/phi/infermeta/backward.h" #include "paddle/phi/infermeta/binary.h" namespace paddle { namespace operators { class Unpool2dOpMaker : public framework::OpProtoAndCheckerMaker { public: void Make() override { AddInput( "X", "(Tensor) The input tensor of unpool operator. " "The format of input tensor is NCHW. Where N is batch size, C is the " "number of channels, H and W is the height and width of feature."); AddInput( "Indices", "(Tensor) The input tensor of the indices given out by MaxPool2d. " "The format of input tensor is NCHW. Where N is batch size, C is the " "number of channels, H and W is the height and width of feature."); AddOutput("Out", "(Tensor) The output tensor of unpool operator." "The format of output tensor is also NCHW." "Where N is batch size, C is " "the number of channels, H and W is the height and " "width of feature."); AddAttr>( "ksize", "(vector), the unpooling window size(height, width) " "of unpooling operator."); AddAttr>("strides", "(vector, default:{1, 1}), " "strides (height, width) of unpooling operator.") .SetDefault({1, 1}); AddAttr>("paddings", "(vector default:{0,0}), " "paddings (height, width) of unpooling operator.") .SetDefault({0, 0}); AddAttr( "unpooling_type", "(string), unpooling type, can be \"max\" for max-unpooling ") .InEnum({"max"}); AddAttr>("output_size", "(vector, optional). The shape of output.") .SetDefault({0, 0}) .SupportTensor(); AddAttr( "data_format", "(string, default NCHW) Only used in " "An optional string from: \"NHWC\", \"NCHW\". " "Defaults to \"NHWC\". Specify the data format of the output data, " "the input will be transformed automatically. ") .SetDefault("NCHW"); AddComment(R"DOC( Input shape is: $(N, C_{in}, H_{in}, W_{in})$, Output shape is: $(N, C_{out}, H_{out}, W_{out})$, where $$ H_{out} = (H_{in}-1) * strides[0] - 2 * paddings[0] + ksize[0] \\ W_{out} = (W_{in}-1) * strides[1] - 2 * paddings[1] + ksize[1] $$ Paper: http://www.matthewzeiler.com/wp-content/uploads/2017/07/iccv2011.pdf )DOC"); } }; class Unpool3dOpMaker : public framework::OpProtoAndCheckerMaker { public: void Make() override { AddInput( "X", "(Tensor) The input tensor of unpool operator. " "The format of input tensor is NCDHW. Where N is batch size, C is the " "number of channels, D, H and W is the depth, height and width of " "feature."); AddInput( "Indices", "(Tensor) The input tensor of the indices given out by MaxPool3d. " "The format of input tensor is NCDHW. Where N is batch size, C is the " "number of channels, D, H and W is the depth, height and width of " "feature."); AddOutput("Out", "(Tensor) The output tensor of unpool operator." "The format of output tensor is also NCDHW." "Where N is batch size, C is " "the number of channels, D, H and W is the depth, height and " "width of feature."); AddAttr>( "ksize", "(vector), the unpooling window size(depth, height, width) " "of unpooling operator."); AddAttr>( "strides", "(vector, default:{1, 1, 1}), " "strides (depth, height, width) of unpooling operator.") .SetDefault({1, 1, 1}); AddAttr>( "paddings", "(vector default:{0, 0,0}), " "paddings (depth, height, width) of unpooling operator.") .SetDefault({0, 0, 0}); AddAttr( "unpooling_type", "(string), unpooling type, can be \"max\" for max-unpooling ") .InEnum({"max"}); AddAttr>("output_size", "(vector, optional). The shape of output.") .SetDefault({0, 0, 0}); AddAttr( "data_format", "(string, default NCDHW)" "Defaults to \"NCDHW\". Specify the data format of the output data, ") .SetDefault("NCDHW"); AddComment(R"DOC( Input shape is: $(N, C_{in}, D_{in}, H_{in}, W_{in})$, Output shape is: $(N, C_{out}, D_{out}, H_{out}, W_{out})$, where $$ D_{out} = (D_{in}-1) * strides[0] - 2 * paddings[0] + ksize[0] \\ H_{out} = (H_{in}-1) * strides[1] - 2 * paddings[1] + ksize[1] \\ W_{out} = (W_{in}-1) * strides[2] - 2 * paddings[2] + ksize[2] $$ )DOC"); } }; int UnpoolOutputSize(int input_size, int ksize, int padding, int stride) { int output_size = (input_size - 1) * stride - 2 * padding + ksize; return output_size; } class UnpoolOp : public framework::OperatorWithKernel { protected: phi::KernelKey GetExpectedKernelType( const framework::ExecutionContext& ctx) const override { return phi::KernelKey(OperatorWithKernel::IndicateVarDataType(ctx, "X"), ctx.GetPlace()); } public: using framework::OperatorWithKernel::OperatorWithKernel; }; class Unpool3dOp : public framework::OperatorWithKernel { protected: phi::KernelKey GetExpectedKernelType( const framework::ExecutionContext& ctx) const override { return phi::KernelKey(OperatorWithKernel::IndicateVarDataType(ctx, "X"), ctx.GetPlace()); } public: using framework::OperatorWithKernel::OperatorWithKernel; }; template class UnpoolOpGradMaker : public framework::SingleGradOpMaker { public: using framework::SingleGradOpMaker::SingleGradOpMaker; void Apply(GradOpPtr op) const override { op->SetType(this->ForwardOpType() + "_grad"); op->SetInput("X", this->Input("X")); op->SetInput("Indices", this->Input("Indices")); op->SetInput("Out", this->Output("Out")); op->SetInput(framework::GradVarName("Out"), this->OutputGrad("Out")); op->SetOutput(framework::GradVarName("X"), this->InputGrad("X")); op->SetAttrMap(this->Attrs()); } }; template class Unpool3dOpGradMaker : public framework::SingleGradOpMaker { public: using framework::SingleGradOpMaker::SingleGradOpMaker; void Apply(GradOpPtr op) const override { op->SetType(this->ForwardOpType() + "_grad"); op->SetInput("X", this->Input("X")); op->SetInput("Indices", this->Input("Indices")); op->SetInput("Out", this->Output("Out")); op->SetInput(framework::GradVarName("Out"), this->OutputGrad("Out")); op->SetOutput(framework::GradVarName("X"), this->InputGrad("X")); op->SetAttrMap(this->Attrs()); } }; class UnpoolOpGrad : public framework::OperatorWithKernel { protected: phi::KernelKey GetExpectedKernelType( const framework::ExecutionContext& ctx) const override { return phi::KernelKey(OperatorWithKernel::IndicateVarDataType(ctx, "X"), ctx.GetPlace()); } public: using framework::OperatorWithKernel::OperatorWithKernel; }; class Unpool3dOpGrad : public framework::OperatorWithKernel { protected: phi::KernelKey GetExpectedKernelType( const framework::ExecutionContext& ctx) const override { return phi::KernelKey(OperatorWithKernel::IndicateVarDataType(ctx, "X"), ctx.GetPlace()); } public: using framework::OperatorWithKernel::OperatorWithKernel; }; } // namespace operators } // namespace paddle namespace ops = paddle::operators; DECLARE_INFER_SHAPE_FUNCTOR(unpool, UnpoolInferShapeFunctor, PD_INFER_META(phi::UnpoolInferMeta)); REGISTER_OPERATOR(unpool, ops::UnpoolOp, ops::Unpool2dOpMaker, ops::UnpoolOpGradMaker, ops::UnpoolOpGradMaker, UnpoolInferShapeFunctor); DECLARE_INFER_SHAPE_FUNCTOR(unpool_grad, UnpoolGradInferShapeFunctor, PD_INFER_META(phi::UnchangedInferMeta)); REGISTER_OPERATOR(unpool_grad, ops::UnpoolOpGrad, UnpoolGradInferShapeFunctor); DECLARE_INFER_SHAPE_FUNCTOR(unpool, Unpool3dInferShapeFunctor, PD_INFER_META(phi::Unpool3dInferMeta)); REGISTER_OPERATOR(unpool3d, ops::Unpool3dOp, ops::Unpool3dOpMaker, ops::Unpool3dOpGradMaker, ops::Unpool3dOpGradMaker, Unpool3dInferShapeFunctor); DECLARE_INFER_SHAPE_FUNCTOR(unpool3d_grad, Unpool3dGradInferShapeFunctor, PD_INFER_META(phi::UnchangedInferMeta)); REGISTER_OPERATOR(unpool3d_grad, ops::Unpool3dOpGrad, Unpool3dGradInferShapeFunctor);