complex_kernel_impl.h 3.7 KB
Newer Older
C
chentianyu03 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

C
Chen Weihang 已提交
17
// See Note [ Why still include the fluid headers? ]
18
#include "paddle/phi/kernels/funcs/broadcast_function.h"
19
#include "paddle/phi/kernels/funcs/complex_functors.h"
20
#include "paddle/phi/kernels/funcs/elementwise_base.h"
C
Chen Weihang 已提交
21
#include "paddle/phi/kernels/funcs/for_range.h"
C
chentianyu03 已提交
22

23
namespace phi {
C
chentianyu03 已提交
24

25
template <typename T, typename Context>
26
void ConjKernel(const Context& dev_ctx,
27 28
                const DenseTensor& x,
                DenseTensor* out) {
C
chentianyu03 已提交
29 30
  auto numel = x.numel();
  auto* x_data = x.data<T>();
31
  auto* out_data = dev_ctx.template Alloc<T>(out);
C
chentianyu03 已提交
32

C
Chen Weihang 已提交
33
  phi::funcs::ForRange<Context> for_range(dev_ctx, numel);
34
  phi::funcs::ConjFunctor<T> functor(x_data, numel, out_data);
C
chentianyu03 已提交
35 36 37
  for_range(functor);
}

F
From00 已提交
38 39 40 41 42 43
template <typename T, typename Context>
void RealKernel(const Context& dev_ctx,
                const DenseTensor& x,
                DenseTensor* out) {
  auto numel = x.numel();
  auto* x_data = x.data<T>();
44 45
  auto* out_data = dev_ctx.template Alloc<phi::dtype::Real<T>>(
      out, static_cast<size_t>(numel * sizeof(phi::dtype::Real<T>)));
F
From00 已提交
46

C
Chen Weihang 已提交
47
  phi::funcs::ForRange<Context> for_range(dev_ctx, numel);
F
From00 已提交
48 49 50 51 52 53 54 55 56 57
  phi::funcs::RealFunctor<T> functor(x_data, out_data, numel);
  for_range(functor);
}

template <typename T, typename Context>
void ImagKernel(const Context& dev_ctx,
                const DenseTensor& x,
                DenseTensor* out) {
  auto numel = x.numel();
  auto* x_data = x.data<T>();
58 59
  auto* out_data = dev_ctx.template Alloc<phi::dtype::Real<T>>(
      out, static_cast<size_t>(numel * sizeof(phi::dtype::Real<T>)));
F
From00 已提交
60

C
Chen Weihang 已提交
61
  phi::funcs::ForRange<Context> for_range(dev_ctx, numel);
F
From00 已提交
62 63 64 65
  phi::funcs::ImagFunctor<T> functor(x_data, out_data, numel);
  for_range(functor);
}

66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106
// Functors passed to phi::funcs::ElementwiseCompute by ComplexKernel below.
/// Binary functor that builds a phi::dtype::complex<T> from two scalars.
///
/// Returns `phi::dtype::complex<T>(x, y)`, i.e. the arguments are forwarded to
/// the complex constructor in the order received. Going by the functor's
/// name, `x` is the real part and `y` the imaginary part.
///
/// The call operator is const because the functor holds no state; this lets
/// it be invoked through const objects and const references as well.
template <typename T>
struct RealAndImagToComplexFunctor {
  inline HOSTDEVICE phi::dtype::complex<T> operator()(const T x,
                                                      const T y) const {
    return phi::dtype::complex<T>(x, y);
  }
};

/// Binary functor that builds a phi::dtype::complex<T> from two scalars given
/// in swapped order.
///
/// The first argument is `y` and the second is `x`; the result is
/// `phi::dtype::complex<T>(x, y)`, so the SECOND argument is passed first to
/// the complex constructor. Going by the functor's name, the caller supplies
/// the imaginary part first and the real part second.
///
/// The call operator is const because the functor holds no state; this lets
/// it be invoked through const objects and const references as well.
template <typename T>
struct ImagAndRealToComplexFunctor {
  inline HOSTDEVICE phi::dtype::complex<T> operator()(const T y,
                                                      const T x) const {
    return phi::dtype::complex<T>(x, y);
  }
};

template <typename T, typename Context>
void ComplexKernel(const Context& dev_ctx,
                   const DenseTensor& x,
                   const DenseTensor& y,
                   DenseTensor* out) {
  using C = phi::dtype::complex<T>;
  dev_ctx.template Alloc<C>(out);

// NOTE(chenfeiyu): be careful of the caveats of calling elementwise-related
// facility functions
#if defined(__NVCC__) || defined(__HIPCC__)
  phi::funcs::ElementwiseCompute<RealAndImagToComplexFunctor<T>, T, C>(
      dev_ctx, x, y, /*axis*/ -1, RealAndImagToComplexFunctor<T>(), out);
#else
  auto x_dims = x.dims();
  auto y_dims = y.dims();
  if (x_dims.size() >= y_dims.size()) {
    phi::funcs::ElementwiseCompute<RealAndImagToComplexFunctor<T>, T, C>(
        dev_ctx, x, y, /*axis*/ -1, RealAndImagToComplexFunctor<T>(), out);
  } else {
    phi::funcs::ElementwiseCompute<ImagAndRealToComplexFunctor<T>, T, C>(
        dev_ctx, x, y, /*axis*/ -1, ImagAndRealToComplexFunctor<T>(), out);
  }
#endif
}

107
}  // namespace phi