algorithm.h 2.5 KB
Newer Older
S
sneaxiy 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once

#include <algorithm>
#include <cstdint>  // for int64_t
#include <numeric>

#include "paddle/fluid/platform/hostdevice.h"

namespace paddle {
namespace operators {
namespace math {

template <typename T>
HOSTDEVICE inline int64_t BinarySearch(const T *x, int64_t num, const T &val) {
  int64_t beg = 0, end = num - 1;
  while (beg <= end) {
    auto mid = ((beg + end) >> 1);
    if (x[mid] == val)
      return mid;
    else if (x[mid] < val)
      beg = mid + 1;
    else
      end = mid - 1;
  }
  return -1;
}

S
sneaxiy 已提交
42 43
template <typename T>
HOSTDEVICE inline size_t LowerBound(const T *x, size_t num, const T &val) {
44
#if defined(__CUDA_ARCH__) || defined(__HIPCC__)  // @{ Group LowerBound
S
sneaxiy 已提交
45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61
  // The following code is from
  // https://en.cppreference.com/w/cpp/algorithm/lower_bound
  auto *first = x;
  int64_t count = static_cast<int64_t>(num);
  while (count > 0) {
    int64_t step = (count >> 1);
    auto *it = first + step;
    if (*it < val) {
      first = ++it;
      count -= (step + 1);
    } else {
      count = step;
    }
  }
  return static_cast<size_t>(first - x);
#else
  return static_cast<size_t>(std::lower_bound(x, x + num, val) - x);
62
#endif  // @} End Group LowerBound
S
sneaxiy 已提交
63 64 65 66
}

template <typename T>
HOSTDEVICE inline size_t UpperBound(const T *x, size_t num, const T &val) {
67
#if defined(__CUDA_ARCH__) || defined(__HIPCC__)  // @{ Group UpperBound
S
sneaxiy 已提交
68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84
  // The following code is from
  // https://en.cppreference.com/w/cpp/algorithm/upper_bound
  auto *first = x;
  int64_t count = static_cast<int64_t>(num);
  while (count > 0) {
    auto step = (count >> 1);
    auto *it = first + step;
    if (val < *it) {
      count = step;
    } else {
      first = ++it;
      count -= (step + 1);
    }
  }
  return static_cast<size_t>(first - x);
#else
  return static_cast<size_t>(std::upper_bound(x, x + num, val) - x);
85
#endif  // @} End Group UpperBound
S
sneaxiy 已提交
86 87
}

S
sneaxiy 已提交
88 89 90
}  // namespace math
}  // namespace operators
}  // namespace paddle