/* Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

  http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include <vector>
#include "paddle/fluid/framework/fleet/heter_ps/heter_comm.h"
#include "paddle/fluid/framework/fleet/heter_ps/heter_ps_base.h"
#if defined(PADDLE_WITH_CUDA)
#include "paddle/fluid/framework/fleet/heter_ps/optimizer.cuh.h"
#endif
#ifdef PADDLE_WITH_HETERPS

namespace paddle {
namespace framework {

template <typename GPUAccessor, template <typename T> class GPUOptimizer>
T
Thunderbrook 已提交
30 31 32
class HeterPs : public HeterPsBase {
 public:
  HeterPs() {}
D
danleifeng 已提交
33 34
  HeterPs(size_t capacity,
          std::shared_ptr<HeterPsResource> resource,
35
          GPUAccessor& gpu_accessor);  // NOLINT
T
Thunderbrook 已提交
36 37 38 39
  virtual ~HeterPs();
  HeterPs(const HeterPs&) = delete;
  HeterPs& operator=(const HeterPs&) = delete;

40 41
  void pull_sparse(int num,
                   FeatureKey* d_keys,
D
danleifeng 已提交
42
                   float* d_vals,
43
                   size_t len) override;
44 45 46 47 48 49
  void build_ps(int num,
                FeatureKey* h_keys,
                char* pool,
                size_t len,
                size_t feature_value_size,
                size_t chunk_size,
Y
yaoxuefeng 已提交
50
                int stream_num) override;
51
#if defined(PADDLE_WITH_CUDA)
52 53
  void set_nccl_comm_and_size(const std::vector<ncclComm_t>& inner_comms,
                              const std::vector<ncclComm_t>& inter_comms,
L
lxsbupt 已提交
54 55
                              int comm_size,
                              int rank_id) override;
Y
yaoxuefeng 已提交
56
  void set_multi_mf_dim(int multi_mf_dim, int max_mf_dim) override;
D
danleifeng 已提交
57

58 59
#endif

60 61 62 63 64 65
  void set_sparse_sgd(const OptimizerConfig& optimizer_config) override;
  void set_embedx_sgd(const OptimizerConfig& optimizer_config) override;

  void end_pass() override;
  int get_index_by_devid(int devid) override;
  void show_one_table(int gpu_num) override;
D
danleifeng 已提交
66 67 68 69 70 71 72 73 74 75 76 77 78 79 80
  void push_sparse(int num, FeatureKey* d_keys, float* d_grads, size_t len);
  void show_table_collisions() override;
#if defined(PADDLE_WITH_CUDA)
  // dedup
  int dedup_keys_and_fillidx(const int gpu_id,
                             const int total_fea_num,
                             const FeatureKey* d_keys,   // input
                             FeatureKey* d_merged_keys,  // output
                             FeatureKey* d_sorted_keys,
                             uint32_t* d_restore_idx,
                             uint32_t* d_sorted_idx,
                             uint32_t* d_offset,
                             uint32_t* d_merged_cnts,
                             bool filter_zero);
#endif
L
lxsbupt 已提交
81 82 83 84 85 86 87 88 89 90
  // reset table
  void reset_table(const int dev_id,
                   size_t capacity,
                   const OptimizerConfig& sgd_config,
                   const OptimizerConfig& embedx_config,
                   bool infer_mode) {
    comm_->reset_table(dev_id, capacity, sgd_config, embedx_config, infer_mode);
  }
  void set_mode(bool infer_mode) { comm_->set_mode(infer_mode); }

T
Thunderbrook 已提交
91
 private:
D
danleifeng 已提交
92
  std::shared_ptr<HeterComm<FeatureKey, float*, float*, GPUAccessor>> comm_;
93
#if defined(PADDLE_WITH_CUDA)
D
danleifeng 已提交
94
  GPUOptimizer<GPUAccessor> opt_;
95
#endif
T
Thunderbrook 已提交
96 97 98 99 100
};

}  // end namespace framework
}  // end namespace paddle
#endif