transform.h 3.7 KB
Newer Older
Y
Yu Yang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License. */

#pragma once

Y
Yu Yang 已提交
17
#include "paddle/platform/device_context.h"
Y
Yu Yang 已提交
18 19 20 21 22
#include "paddle/platform/enforce.h"
#include "paddle/platform/hostdevice.h"
#include "paddle/platform/place.h"

#include <algorithm>
Y
Yu Yang 已提交
23
#include <type_traits>
Y
Yu Yang 已提交
24
#ifdef __NVCC__
Y
Yu Yang 已提交
25
#include <thrust/execution_policy.h>
Y
Yu Yang 已提交
26
#include <thrust/transform.h>
27
#include "paddle/platform/details/device_ptr_cast.h"
Y
Yu Yang 已提交
28 29 30 31
#endif

namespace paddle {
namespace platform {
32

Y
Yu Yang 已提交
33
// Transform on host or device. It provides the same API as std::transform in
// the standard library, with an extra leading DeviceContext argument.
34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51
// Primary template of the Transform functor, selected by the Place type.
//
// Only the two call operators are declared here; no bodies are given in the
// primary template itself. Both take the DeviceContext first, followed by
// the same iterator/functor arguments as the matching std::transform form.
template <class Place>
struct Transform {
  // Unary form: one input range [first, last), one output iterator.
  template <class InputIter, class OutputIter, class UnaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter first, InputIter last,
                  OutputIter result,
                  UnaryOperation op);

  // Binary form: input range [first1, last1) paired with a second input
  // starting at first2, one output iterator.
  template <class InputIter1, class InputIter2, class OutputIter,
            class BinaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter1 first1, InputIter1 last1,
                  InputIter2 first2,
                  OutputIter result,
                  BinaryOperation op);
};

// Host (CPU) specialization of Transform: forwards to std::transform.
//
// The `context` argument is accepted so the call signature matches the
// primary template; it is not read by either overload.
// NOTE(review): unlike a place-checked implementation, nothing here verifies
// that `context` actually refers to a CPU place -- confirm whether callers
// rely on that.
template <>
struct Transform<platform::CPUPlace> {
  // Unary form: applies `op` to each element of [first, last) and writes the
  // results starting at `result`.
  template <typename InputIter, typename OutputIter, typename UnaryOperation>
  void operator()(const DeviceContext& context, InputIter first, InputIter last,
                  OutputIter result, UnaryOperation op) {
    std::transform(first, last, result, op);
  }

  // Binary form: applies `op` to pairs drawn from [first1, last1) and the
  // range starting at `first2`, writing the results starting at `result`.
  template <typename InputIter1, typename InputIter2, typename OutputIter,
            typename BinaryOperation>
  void operator()(const DeviceContext& context, InputIter1 first1,
                  InputIter1 last1, InputIter2 first2, OutputIter result,
                  BinaryOperation op) {
    std::transform(first1, last1, first2, result, op);
  }
};

Y
Yu Yang 已提交
64
#ifdef __NVCC__
65 66 67 68 69 70 71
// Device (GPU) specialization of Transform: calls thrust::transform with an
// execution policy bound to the stream returned by the context.
//
// Both overloads:
//   1. enforce (via PADDLE_ENFORCE) that context.GetPlace() is a GPU place;
//   2. view `context` as a CUDADeviceContext to reach its stream();
//   3. pass every iterator through details::DevPtrCast before handing it to
//      thrust.
template <>
struct Transform<platform::GPUPlace> {
  // Unary form: applies `op` to each element of [first, last) and writes the
  // results starting at `result`.
  template <typename InputIter, typename OutputIter, typename UnaryOperation>
  void operator()(const DeviceContext& context, InputIter first, InputIter last,
                  OutputIter result, UnaryOperation op) {
    auto place = context.GetPlace();
    PADDLE_ENFORCE(is_gpu_place(place), "It must use GPU place.");
    // NOTE(review): reinterpret_cast presumes the CUDADeviceContext object
    // starts at the same address as its DeviceContext part -- confirm against
    // the class hierarchy; a static_cast would be safer if it is a plain
    // derived class.
    auto& ctx = reinterpret_cast<const CUDADeviceContext&>(context);
    thrust::transform(thrust::cuda::par.on(ctx.stream()),
                      details::DevPtrCast(first), details::DevPtrCast(last),
                      details::DevPtrCast(result), op);
  }

  // Binary form: applies `op` to pairs drawn from [first1, last1) and the
  // range starting at `first2`, writing the results starting at `result`.
  template <typename InputIter1, typename InputIter2, typename OutputIter,
            typename BinaryOperation>
  void operator()(const DeviceContext& context, InputIter1 first1,
                  InputIter1 last1, InputIter2 first2, OutputIter result,
                  BinaryOperation op) {
    auto place = context.GetPlace();
    PADDLE_ENFORCE(is_gpu_place(place), "It must use GPU place.");
    // NOTE(review): same cast assumption as in the unary overload.
    auto& ctx = reinterpret_cast<const CUDADeviceContext&>(context);
    thrust::transform(thrust::cuda::par.on(ctx.stream()),
                      details::DevPtrCast(first1), details::DevPtrCast(last1),
                      details::DevPtrCast(first2), details::DevPtrCast(result),
                      op);
  }
};
92
#endif
Y
Yu Yang 已提交
93 94 95

}  // namespace platform
}  // namespace paddle