// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #pragma once // See Note [ Why still include the fluid headers? ] #include "paddle/phi/kernels/funcs/broadcast_function.h" #include "paddle/phi/kernels/funcs/complex_functors.h" #include "paddle/phi/kernels/funcs/elementwise_base.h" #include "paddle/phi/kernels/funcs/for_range.h" namespace phi { template void ConjKernel(const Context& dev_ctx, const DenseTensor& x, DenseTensor* out) { auto numel = x.numel(); auto* x_data = x.data(); auto* out_data = dev_ctx.template Alloc(out); phi::funcs::ForRange for_range(dev_ctx, numel); phi::funcs::ConjFunctor functor(x_data, numel, out_data); for_range(functor); } template void RealKernel(const Context& dev_ctx, const DenseTensor& x, DenseTensor* out) { auto numel = x.numel(); auto* x_data = x.data(); auto* out_data = dev_ctx.template Alloc>( out, static_cast(numel * sizeof(phi::dtype::Real))); phi::funcs::ForRange for_range(dev_ctx, numel); phi::funcs::RealFunctor functor(x_data, out_data, numel); for_range(functor); } template void ImagKernel(const Context& dev_ctx, const DenseTensor& x, DenseTensor* out) { auto numel = x.numel(); auto* x_data = x.data(); auto* out_data = dev_ctx.template Alloc>( out, static_cast(numel * sizeof(phi::dtype::Real))); phi::funcs::ForRange for_range(dev_ctx, numel); phi::funcs::ImagFunctor functor(x_data, out_data, numel); for_range(functor); } // functors to use with ElementwiseComputeEx template struct RealAndImagToComplexFunctor { inline HOSTDEVICE phi::dtype::complex operator()(const T x, const T y) { return phi::dtype::complex(x, y); } }; template struct ImagAndRealToComplexFunctor { inline HOSTDEVICE phi::dtype::complex operator()(const T y, const T x) { return phi::dtype::complex(x, y); } }; template void ComplexKernel(const Context& dev_ctx, const DenseTensor& x, const DenseTensor& y, DenseTensor* out) { using C = phi::dtype::complex; dev_ctx.template Alloc(out); // NOTE(chenfeiyu): be careful of the caveats of calling elementwise-related // facility functions #if defined(__NVCC__) || defined(__HIPCC__) phi::funcs::ElementwiseCompute, T, C>( dev_ctx, x, y, /*axis*/ -1, RealAndImagToComplexFunctor(), out); #else auto x_dims = x.dims(); auto y_dims = y.dims(); if (x_dims.size() >= y_dims.size()) { phi::funcs::ElementwiseCompute, T, C>( dev_ctx, x, y, /*axis*/ -1, RealAndImagToComplexFunctor(), out); } else { phi::funcs::ElementwiseCompute, T, C>( dev_ctx, x, y, /*axis*/ -1, ImagAndRealToComplexFunctor(), out); } #endif } } // namespace phi