// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/operators/abs_op.h"
#include "paddle/fluid/operators/elementwise/elementwise_op_impl.cu.h"
#include "paddle/fluid/platform/complex128.h"
#include "paddle/fluid/platform/complex64.h"
#include "paddle/fluid/platform/float16.h"

namespace paddle {
namespace operators {

// Device-side functor computing the absolute value of one element.
//
// The primary template is only declared; the two partial specializations
// below supply the implementations. The second template parameter exists
// solely to choose between them, and it is defaulted so that callers can
// write `CudaAbsFunctor<T>`.
template <typename T, typename Enable = void>
struct CudaAbsFunctor;

// Specialization whose result type is math::Real<T> rather than T.
// NOTE(review): math::Complex is declared outside this file; presumably it
// enables this specialization only when T is a complex type (T differs from
// math::Real<T>) - confirm against its definition.
template <typename T>
struct CudaAbsFunctor<T, math::Complex<T, math::Real<T>>> {
  // args: pointer to the operand(s) of the element being processed; only
  // args[0] is read. Returns abs(args[0]) as math::Real<T>.
  __device__ __forceinline__ math::Real<T> operator()(const T* args) const {
    // Unqualified call: overload resolution picks the `abs` for T.
    return abs(args[0]);
  }
};

// Specialization whose result type is T itself.
// NOTE(review): math::NoComplex is declared outside this file; presumably it
// enables this specialization only when T is already a real type - confirm.
template <typename T>
struct CudaAbsFunctor<T, math::NoComplex<T, math::Real<T>>> {
  // args: pointer to the operand(s) of the element being processed; only
  // args[0] is read. Returns std::abs(args[0]).
  __device__ __forceinline__ T operator()(const T* args) const {
    return std::abs(args[0]);
  }
};

// CUDA specialization of the forward `abs` kernel.
template <typename T>
class AbsKernel<platform::CUDADeviceContext, T>
    : public framework::OpKernel<T> {
 public:
  // Reads input "X", prepares output "Out" with element type math::Real<T>
  // on the context's place, and launches the same-dims elementwise kernel
  // with CudaAbsFunctor<T> as the per-element operation.
  void Compute(const framework::ExecutionContext& context) const override {
    const Tensor* x = context.Input<Tensor>("X");
    Tensor* out = context.Output<Tensor>("Out");
    // The output element type is math::Real<T>, matching the functor's
    // return type in the first specialization above.
    out->mutable_data<math::Real<T>>(context.GetPlace());

    auto& dev_ctx =
        context.template device_context<platform::CUDADeviceContext>();
    std::vector<const framework::Tensor*> ins = {x};
    std::vector<framework::Tensor*> outs = {out};
    auto functor = CudaAbsFunctor<T>();
    // NOTE(review): the leading template argument (ElementwiseType::kUnary)
    // was reconstructed from the single-input call shape - confirm against
    // elementwise_op_impl.cu.h.
    LaunchSameDimsElementwiseCudaKernel<ElementwiseType::kUnary, T,
                                        math::Real<T>>(dev_ctx, ins, &outs,
                                                       functor);
  }
};

}  // namespace operators
}  // namespace paddle

namespace ops = paddle::operators;
namespace plat = paddle::platform;

// NOTE(review): each registration below lists seven kernel instantiations,
// the last two with a nested template argument. The concrete element types
// (float, double, int, int64_t, plat::float16, plat::complex<float>,
// plat::complex<double>) were reconstructed - confirm against the CPU
// registrations of the same operators.
REGISTER_OP_CUDA_KERNEL(
    abs, ops::AbsKernel<plat::CUDADeviceContext, float>,
    ops::AbsKernel<plat::CUDADeviceContext, double>,
    ops::AbsKernel<plat::CUDADeviceContext, int>,
    ops::AbsKernel<plat::CUDADeviceContext, int64_t>,
    ops::AbsKernel<plat::CUDADeviceContext, plat::float16>,
    ops::AbsKernel<plat::CUDADeviceContext, plat::complex<float>>,
    ops::AbsKernel<plat::CUDADeviceContext, plat::complex<double>>);

REGISTER_OP_CUDA_KERNEL(
    abs_grad, ops::AbsGradKernel<plat::CUDADeviceContext, float>,
    ops::AbsGradKernel<plat::CUDADeviceContext, double>,
    ops::AbsGradKernel<plat::CUDADeviceContext, int>,
    ops::AbsGradKernel<plat::CUDADeviceContext, int64_t>,
    ops::AbsGradKernel<plat::CUDADeviceContext, plat::float16>,
    ops::AbsGradKernel<plat::CUDADeviceContext, plat::complex<float>>,
    ops::AbsGradKernel<plat::CUDADeviceContext, plat::complex<double>>);

REGISTER_OP_CUDA_KERNEL(
    abs_grad_grad, ops::AbsDoubleGradKernel<plat::CUDADeviceContext, float>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, double>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, int>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, int64_t>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, plat::float16>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, plat::complex<float>>,
    ops::AbsDoubleGradKernel<plat::CUDADeviceContext, plat::complex<double>>);