diff --git a/paddle/fluid/operators/activation_op_mlu.cc b/paddle/fluid/operators/activation_op_mlu.cc
index 6ba86351e6af55d2d4bf8a8bbb5fb28e30da596d..d1087965f044e35e8c2f7b79bd7fc082cd47b770 100644
--- a/paddle/fluid/operators/activation_op_mlu.cc
+++ b/paddle/fluid/operators/activation_op_mlu.cc
@@ -399,11 +399,81 @@ class HardSigmoidGradMLUKernel : public framework::OpKernel<T> {
   }
 };
 
+template <typename T>
+class ReciprocalMLUKernel : public framework::OpKernel<T> {
+ public:
+  void Compute(const framework::ExecutionContext& ctx) const override {
+    auto* x = ctx.Input<Tensor>("X");
+    auto* out = ctx.Output<Tensor>("Out");
+    auto place = ctx.GetPlace();
+    out->mutable_data<T>(place);
+    MLUCnnlTensorDesc x_desc(*x);
+    MLUCnnlTensorDesc out_desc(*out);
+    MLUCnnl::Reciprocal(
+        ctx, x_desc.get(), GetBasePtr(x), out_desc.get(), GetBasePtr(out));
+  }
+};
+
+template <typename T>
+class ReciprocalGradMLUKernel : public framework::OpKernel<T> {
+ public:
+  void Compute(const framework::ExecutionContext& ctx) const override {
+    auto* out = ctx.Input<Tensor>("Out");
+    auto* dout = ctx.Input<Tensor>(framework::GradVarName("Out"));
+    auto* dx = ctx.Output<Tensor>(framework::GradVarName("X"));
+    auto place = ctx.GetPlace();
+    dx->mutable_data<T>(place);
+    Tensor square_out;
+    square_out.Resize(out->dims());
+    square_out.mutable_data<T>(place);
+    MLUCnnlTensorDesc out_desc(*out);
+    MLUCnnlTensorDesc dout_desc(*dout);
+    MLUCnnlTensorDesc dx_desc(*dx);
+    MLUCnnlTensorDesc square_out_desc(square_out);
+    MLUCnnl::Square(ctx,
+                    out_desc.get(),
+                    GetBasePtr(out),
+                    square_out_desc.get(),
+                    GetBasePtr(&square_out));
+    cnnlOpTensorDesc_t op_tensor_op = CNNL_OP_TENSOR_MUL;
+    cnnlDataType_t op_tensor_comp_type = CNNL_DTYPE_FLOAT;
+    cnnlNanPropagation_t op_tensor_nan_opt = CNNL_NOT_PROPAGATE_NAN;
+    MLUCnnlOpTensorDesc op_tensor_desc(
+        op_tensor_op, op_tensor_comp_type, op_tensor_nan_opt);
+    float alpha1_float = -1;
+    float alpha2_float = 1;
+    float beta_float = 0;
+    MLUCnnl::OpTensor(ctx,
+                      op_tensor_desc.get(),
+                      dout_desc.get(),
+                      GetBasePtr(dout),
+                      square_out_desc.get(),
+                      GetBasePtr(&square_out),
+                      dx_desc.get(),
+                      GetBasePtr(dx),
+                      op_tensor_comp_type,
+                      alpha1_float,
+                      alpha2_float,
+                      beta_float);
+  }
+};
+
 }  // namespace operators
 }  // namespace paddle
 
 namespace ops = paddle::operators;
 
+// reciprocal
+REGISTER_OP_MLU_KERNEL(
+    reciprocal,
+    ops::ReciprocalMLUKernel<float>,
+    ops::ReciprocalMLUKernel<paddle::platform::float16>);
+
+REGISTER_OP_MLU_KERNEL(
+    reciprocal_grad,
+    ops::ReciprocalGradMLUKernel<float>,
+    ops::ReciprocalGradMLUKernel<paddle::platform::float16>);
+
 // relu
 REGISTER_OP_MLU_KERNEL(
     relu,
diff --git a/python/paddle/fluid/tests/unittests/mlu/test_reciprocal_op_mlu.py b/python/paddle/fluid/tests/unittests/mlu/test_reciprocal_op_mlu.py
new file mode 100644
index 0000000000000000000000000000000000000000..1791b1dab28b824d32909534b3233aa5aaf23675
--- /dev/null
+++ b/python/paddle/fluid/tests/unittests/mlu/test_reciprocal_op_mlu.py
@@ -0,0 +1,69 @@
+# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+from __future__ import print_function, division
+
+import numpy as np
+import unittest
+import sys
+
+sys.path.append("..")
+from op_test import OpTest, skip_check_grad_ci
+import paddle
+
+paddle.enable_static()
+
+
+class TestMLUReciprocal(OpTest):
+
+    def setUp(self):
+        self.op_type = "reciprocal"
+        self.set_mlu()
+        self.init_dtype()
+
+        np.random.seed(1024)
+        x = np.random.uniform(1, 2, [11, 17]).astype(self.dtype)
+        out = np.reciprocal(x)
+
+        self.inputs = {'X': OpTest.np_dtype_to_fluid_dtype(x)}
+        self.outputs = {'Out': out}
+
+    def test_check_output(self):
+        self.check_output_with_place(self.place)
+
+    def test_check_grad(self):
+        self.check_grad_with_place(self.place, ['X'],
+                                   'Out',
+                                   max_relative_error=0.01)
+
+    def set_mlu(self):
+        self.__class__.use_mlu = True
+        self.place = paddle.MLUPlace(0)
+
+    def init_dtype(self):
+        self.dtype = np.float32
+
+
+class TestMLUReciprocalFp16(TestMLUReciprocal):
+
+    def set_mlu(self):
+        self.__class__.use_mlu = True
+        self.place = paddle.MLUPlace(0)
+
+    def init_dtype(self):
+        self.dtype = np.float16
+
+
+if __name__ == '__main__':
+    unittest.main()
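
Note on the backward formula (a reviewer-side sketch, not part of the patch): for y = 1/x the derivative is dy/dx = -1/x^2 = -y^2, so ReciprocalGradMLUKernel computes dX = -dOut * Out^2 by squaring Out with MLUCnnl::Square and then combining with MLUCnnl::OpTensor, where alpha1 = -1, alpha2 = 1, beta = 0 yield dX = (alpha1 * dOut) * (alpha2 * square_out) + beta * dX. A minimal NumPy check of the same identity, assuming only numpy is available:

    import numpy as np

    x = np.random.uniform(1, 2, [11, 17]).astype(np.float32)
    out = np.reciprocal(x)         # forward: Out = 1 / X
    dout = np.ones_like(out)       # upstream gradient
    square_out = np.square(out)    # the MLUCnnl::Square step
    dx = -1.0 * dout * square_out  # the OpTensor step: alpha1=-1, alpha2=1, beta=0

    # Agrees with the analytic derivative d(1/x)/dx = -1/x^2.
    assert np.allclose(dx, -dout / np.square(x), rtol=1e-4)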