transform.h 3.9 KB
Newer Older
Y
Yu Yang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

   http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License. */

#pragma once

Y
Yu Yang 已提交
17
#include "paddle/platform/device_context.h"
Y
Yu Yang 已提交
18 19 20 21 22
#include "paddle/platform/enforce.h"
#include "paddle/platform/hostdevice.h"
#include "paddle/platform/place.h"

#include <algorithm>
Y
Yu Yang 已提交
23
#include <type_traits>
Y
Yu Yang 已提交
24
#ifdef __NVCC__
Y
Yu Yang 已提交
25
#include <thrust/execution_policy.h>
Y
Yu Yang 已提交
26
#include <thrust/transform.h>
27
#include "paddle/platform/details/device_ptr_cast.h"
Y
Yu Yang 已提交
28 29 30 31
#endif

namespace paddle {
namespace platform {
32

Y
Yu Yang 已提交
33
// Transform applies an operation over a range on the host or on the device.
// It provides the same API as std::transform in the standard library.
34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53
template <typename Place>
struct Transform {
  // Unary overload: takes the input range [first, last), the output iterator
  // `result`, and the unary functor `op`. It is only declared in the primary
  // template; each Place specialization supplies its own definition.
  template <typename InputIter, typename OutputIter, typename UnaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter first,
                  InputIter last,
                  OutputIter result,
                  UnaryOperation op);

  // Binary overload: takes the first input range [first1, last1), the start
  // of the second input range `first2`, the output iterator `result`, and the
  // binary functor `op`. Declared only, like the unary overload.
  template <typename InputIter1,
            typename InputIter2,
            typename OutputIter,
            typename BinaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter1 first1,
                  InputIter1 last1,
                  InputIter2 first2,
                  OutputIter result,
                  BinaryOperation op);
};

template <>
struct Transform<platform::CPUPlace> {
  // Unary transform on the host.
  //
  // Enforces that `context` reports a CPU place, then forwards the range
  // [first, last), the output iterator `result` and the functor `op` to
  // std::transform.
  template <typename InputIter, typename OutputIter, typename UnaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter first,
                  InputIter last,
                  OutputIter result,
                  UnaryOperation op) {
    const auto ctx_place = context.GetPlace();
    PADDLE_ENFORCE(is_cpu_place(ctx_place), "It must use CPU place.");
    std::transform(first, last, result, op);
  }

  // Binary transform on the host.
  //
  // Enforces that `context` reports a CPU place, then forwards the first
  // range [first1, last1), the start of the second range `first2`, the output
  // iterator `result` and the functor `op` to std::transform.
  template <typename InputIter1,
            typename InputIter2,
            typename OutputIter,
            typename BinaryOperation>
  void operator()(const DeviceContext& context,
                  InputIter1 first1,
                  InputIter1 last1,
                  InputIter2 first2,
                  OutputIter result,
                  BinaryOperation op) {
    const auto ctx_place = context.GetPlace();
    PADDLE_ENFORCE(is_cpu_place(ctx_place), "It must use CPU place.");
    std::transform(first1, last1, first2, result, op);
  }
};

Y
Yu Yang 已提交
68
#ifdef __NVCC__
69 70 71 72 73 74 75
template <>
struct Transform<platform::GPUPlace> {
  // Unary transform on the device.
  //
  // Enforces that `context` reports a GPU place, then calls thrust::transform
  // with an execution policy bound to the stream returned by the CUDA
  // context's stream(). Every iterator is passed through details::DevPtrCast
  // first (presumably so raw pointers are treated as device pointers by
  // thrust -- confirm against device_ptr_cast.h).
  template <typename InputIter, typename OutputIter, typename UnaryOperation>
  void operator()(const DeviceContext& context, InputIter first, InputIter last,
                  OutputIter result, UnaryOperation op) {
    auto place = context.GetPlace();
    PADDLE_ENFORCE(is_gpu_place(place), "It must use GPU place.");
    // Downcast with static_cast rather than reinterpret_cast: it is checked
    // by the compiler and applies any base-to-derived pointer adjustment.
    // NOTE(review): assumes CUDADeviceContext publicly derives from
    // DeviceContext -- confirm in device_context.h.
    auto& ctx = static_cast<const CUDADeviceContext&>(context);
    thrust::transform(thrust::cuda::par.on(ctx.stream()),
                      details::DevPtrCast(first), details::DevPtrCast(last),
                      details::DevPtrCast(result), op);
  }

  // Binary transform on the device.
  //
  // Same checks and stream binding as the unary overload; additionally takes
  // the start of a second input range `first2` and a binary functor `op`.
  template <typename InputIter1, typename InputIter2, typename OutputIter,
            typename BinaryOperation>
  void operator()(const DeviceContext& context, InputIter1 first1,
                  InputIter1 last1, InputIter2 first2, OutputIter result,
                  BinaryOperation op) {
    auto place = context.GetPlace();
    PADDLE_ENFORCE(is_gpu_place(place), "It must use GPU place.");
    // See the unary overload: static_cast is the appropriate named cast for a
    // base-to-derived downcast (same inheritance assumption applies).
    auto& ctx = static_cast<const CUDADeviceContext&>(context);
    thrust::transform(thrust::cuda::par.on(ctx.stream()),
                      details::DevPtrCast(first1), details::DevPtrCast(last1),
                      details::DevPtrCast(first2), details::DevPtrCast(result),
                      op);
  }
};
96
#endif
Y
Yu Yang 已提交
97 98 99

}  // namespace platform
}  // namespace paddle