hashtable.h 3.4 KB
Newer Older
T
Thunderbrook 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
/* Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

  http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
T
Thunderbrook 已提交
16
#include <glog/logging.h>
T
Thunderbrook 已提交
17 18 19
#include <limits>
#include <memory>
#include <vector>
T
Thunderbrook 已提交
20
#ifdef PADDLE_WITH_PSLIB
T
Thunderbrook 已提交
21
#include "common_value.h"  // NOLINT
T
Thunderbrook 已提交
22 23
#endif
#ifdef PADDLE_WITH_PSCORE
T
Thunderbrook 已提交
24
#include "paddle/fluid/distributed/table/depends/large_scale_kv.h"
T
Thunderbrook 已提交
25
#endif
26
#include "paddle/fluid/framework/rw_lock.h"
T
Thunderbrook 已提交
27
#include "thrust/pair.h"
28
// #include "cudf/concurrent_unordered_map.cuh.h"
T
Thunderbrook 已提交
29
#include "paddle/fluid/framework/fleet/heter_ps/cudf/concurrent_unordered_map.cuh.h"
30 31
#include "paddle/fluid/framework/fleet/heter_ps/feature_value.h"
#include "paddle/fluid/framework/fleet/heter_ps/mem_pool.h"
T
Thunderbrook 已提交
32
#ifdef PADDLE_WITH_HETERPS
33
#include "paddle/fluid/platform/device/gpu/gpu_types.h"
T
Thunderbrook 已提交
34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56

namespace paddle {
namespace framework {

// Key/value map type that HashTable keeps its entries in.
//
// Thin wrapper over concurrent_unordered_map that pins the third template
// argument to std::numeric_limits<KeyType>::max() and always passes a
// default-constructed ValType as the second constructor argument.
// NOTE(review): presumably these are the map's "unused key" sentinel and
// "unused value" filler -- confirm against concurrent_unordered_map.cuh.h.
template <typename KeyType, typename ValType>
class TableContainer
    : public concurrent_unordered_map<KeyType, ValType,
                                      std::numeric_limits<KeyType>::max()> {
  // Shorthand for the (long) base-class type; private to this wrapper.
  using MapBase =
      concurrent_unordered_map<KeyType, ValType,
                               std::numeric_limits<KeyType>::max()>;

 public:
  // Forwards `capacity` to the underlying map together with ValType().
  TableContainer(size_t capacity) : MapBase(capacity, ValType()) {}
};

template <typename KeyType, typename ValType>
class HashTable {
 public:
  HashTable(size_t capacity);
  virtual ~HashTable();
  HashTable(const HashTable&) = delete;
  HashTable& operator=(const HashTable&) = delete;
  void insert(const KeyType* d_keys, const ValType* d_vals, size_t len,
57
              gpuStream_t stream);
58 59
  void insert(const KeyType* d_keys, size_t len, char* pool, size_t start_index,
              gpuStream_t stream);
T
Thunderbrook 已提交
60
  void get(const KeyType* d_keys, ValType* d_vals, size_t len,
61
           gpuStream_t stream);
62
  void get(const KeyType* d_keys, char* d_vals, size_t len, gpuStream_t stream);
T
Thunderbrook 已提交
63
  void show();
T
Thunderbrook 已提交
64
  void dump_to_cpu(int devid, cudaStream_t stream);
T
Thunderbrook 已提交
65 66 67

  template <typename GradType, typename Sgd>
  void update(const KeyType* d_keys, const GradType* d_grads, size_t len,
68
              Sgd sgd, gpuStream_t stream);
T
Thunderbrook 已提交
69

70 71 72 73
  template <typename Sgd>
  void update(const KeyType* d_keys, const char* d_grads, size_t len, Sgd sgd,
              gpuStream_t stream);

74 75
  int size() { return container_->size(); }

76 77 78 79 80 81 82 83
  void set_feature_value_size(size_t pull_feature_value_size,
                              size_t push_grad_value_size) {
    pull_feature_value_size_ = pull_feature_value_size;
    push_grad_value_size_ = push_grad_value_size;
    VLOG(3) << "hashtable set pull value size: " << pull_feature_value_size_
            << " push value size: " << push_grad_value_size_;
  }

84 85
  std::unique_ptr<RWLock> rwlock_{nullptr};

T
Thunderbrook 已提交
86 87 88 89 90
 private:
  TableContainer<KeyType, ValType>* container_;
  int BLOCK_SIZE_{256};
  float LOAD_FACTOR{0.75f};
  size_t capacity_;
91 92 93
  size_t max_mf_dim_ = 8;
  size_t pull_feature_value_size_;
  size_t push_grad_value_size_;
T
Thunderbrook 已提交
94 95 96
};
}  // end namespace framework
}  // end namespace paddle
T
Thunderbrook 已提交
97
#include "hashtable_inl.h"
T
Thunderbrook 已提交
98
#endif