/* Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

  http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include <cstdint>
#include <memory>
#include <vector>

#include "paddle/fluid/framework/fleet/heter_ps/heter_comm.h"
#include "paddle/fluid/framework/fleet/heter_ps/heter_ps_base.h"
#if defined(PADDLE_WITH_CUDA)
#include "paddle/fluid/framework/fleet/heter_ps/optimizer.cuh.h"
#endif

#ifdef PADDLE_WITH_HETERPS

namespace paddle {
namespace framework {

D
danleifeng 已提交
29
template <typename GPUAccessor, template <typename T> class GPUOptimizer>
T
Thunderbrook 已提交
30 31 32
class HeterPs : public HeterPsBase {
 public:
  HeterPs() {}
D
danleifeng 已提交
33 34
  HeterPs(size_t capacity,
          std::shared_ptr<HeterPsResource> resource,
D
danleifeng 已提交
35
          GPUAccessor& gpu_accessor);
T
Thunderbrook 已提交
36 37 38 39
  virtual ~HeterPs();
  HeterPs(const HeterPs&) = delete;
  HeterPs& operator=(const HeterPs&) = delete;

40 41
  void pull_sparse(int num,
                   FeatureKey* d_keys,
D
danleifeng 已提交
42
                   float* d_vals,
43
                   size_t len) override;
D
danleifeng 已提交
44 45
  // void build_ps(int num, FeatureKey* h_keys, float* h_vals, size_t len,
  //               size_t chunk_size, int stream_num) override;
46 47 48 49 50 51
  void build_ps(int num,
                FeatureKey* h_keys,
                char* pool,
                size_t len,
                size_t feature_value_size,
                size_t chunk_size,
Y
yaoxuefeng 已提交
52
                int stream_num) override;
53
#if defined(PADDLE_WITH_CUDA)
54 55 56
  void set_nccl_comm_and_size(const std::vector<ncclComm_t>& inner_comms,
                              const std::vector<ncclComm_t>& inter_comms,
                              int comm_size) override;
Y
yaoxuefeng 已提交
57
  void set_multi_mf_dim(int multi_mf_dim, int max_mf_dim) override;
D
danleifeng 已提交
58

59 60
#endif

61 62 63 64 65 66
  void set_sparse_sgd(const OptimizerConfig& optimizer_config) override;
  void set_embedx_sgd(const OptimizerConfig& optimizer_config) override;

  void end_pass() override;
  int get_index_by_devid(int devid) override;
  void show_one_table(int gpu_num) override;
D
danleifeng 已提交
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81
  void push_sparse(int num, FeatureKey* d_keys, float* d_grads, size_t len);
  void show_table_collisions() override;
#if defined(PADDLE_WITH_CUDA)
  // dedup
  int dedup_keys_and_fillidx(const int gpu_id,
                             const int total_fea_num,
                             const FeatureKey* d_keys,   // input
                             FeatureKey* d_merged_keys,  // output
                             FeatureKey* d_sorted_keys,
                             uint32_t* d_restore_idx,
                             uint32_t* d_sorted_idx,
                             uint32_t* d_offset,
                             uint32_t* d_merged_cnts,
                             bool filter_zero);
#endif
T
Thunderbrook 已提交
82
 private:
D
danleifeng 已提交
83
  std::shared_ptr<HeterComm<FeatureKey, float*, float*, GPUAccessor>> comm_;
84
#if defined(PADDLE_WITH_CUDA)
D
danleifeng 已提交
85
  GPUOptimizer<GPUAccessor> opt_;
86
#endif
T
Thunderbrook 已提交
87 88 89 90 91
};

}  // end namespace framework
}  // end namespace paddle
#endif