scatter.h 2.4 KB
Newer Older
Z
zchen0211 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29
/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include <cstddef>
#include <cstring>

#include "paddle/framework/ddim.h"
#include "paddle/framework/eigen.h"
#include "paddle/framework/tensor.h"
#include "paddle/platform/place.h"

namespace paddle {
namespace operators {

// Shorthand alias for framework::Tensor inside paddle::operators.
using Tensor = framework::Tensor;

/**
 * CPU kernel for scatter-assign. For every i in [0, index_size) the i-th
 * slice of src is copied over the index[i]-th slice of output:
 *   output[index[i] * slice_size + k] = src[i * slice_size + k],
 *   for k in [0, slice_size).
 *
 * src:        index_size consecutive slices of slice_size elements each
 * index:      index_size destination slice numbers
 * slice_size: number of T elements in one slice
 * index_size: number of slices to copy
 * output:     destination buffer, written in place
 *
 * Slices are copied in increasing i, so when an index value is repeated the
 * last occurrence wins. Indices are NOT range-checked: the caller must make
 * sure every index[i] addresses a slice that lies inside output. Data is
 * moved with memcpy, i.e. T is copied as raw bytes.
 */
template <typename T>
void CPUScatterAssign(const T* src, const int* index, const int slice_size,
                      const int index_size, T* output) {
  // Nothing to copy. This also keeps a negative slice_size from being
  // converted into an enormous unsigned byte count for memcpy.
  if (slice_size <= 0 || index_size <= 0) return;

  const std::size_t slice_bytes =
      static_cast<std::size_t>(slice_size) * sizeof(T);
  // Element offsets are computed in ptrdiff_t: index * slice_size can exceed
  // INT_MAX for large tensors, and signed int overflow is undefined behavior.
  const std::ptrdiff_t stride = slice_size;

  for (std::ptrdiff_t i = 0; i < index_size; ++i) {
    const std::ptrdiff_t dst_offset = index[i] * stride;
    std::memcpy(output + dst_offset, src + i * stride, slice_bytes);
  }
}

/**
 * Return a updated tensor from source tensor, scattered according to index:
Z
zchen0211 已提交
43
 * dst[i] = src[index[i]]
Z
zchen0211 已提交
44 45 46 47 48
 * input[src]: type-T source Tensor
 * input[index]: type-int index Tensor (1-D)
 * return: output tensor
 */
template <typename T>
Z
zchen0211 已提交
49
void ScatterAssign(const platform::Place& place,
Z
zchen0211 已提交
50 51 52
                   const paddle::framework::Tensor* src,
                   const paddle::framework::Tensor* index,
                   paddle::framework::Tensor* output) {
Z
zchen0211 已提交
53
  PADDLE_ENFORCE(platform::is_cpu_place(place));
Z
zchen0211 已提交
54 55 56 57 58 59 60
  // check index of shape 1-D
  PADDLE_ENFORCE(index->dims().size() == 1);
  int index_size = index->dims()[0];

  auto src_dims = src->dims();
  auto dst_dims = output->dims();

Z
zchen0211 已提交
61 62 63 64
  const T* p_src = src->data<T>();
  const int* p_index = index->data<int>();
  T* p_output = output->data<T>();

Z
zchen0211 已提交
65
  // check src shape and dst shape should match
Z
zchen0211 已提交
66
  for (int i = 1; i < src_dims.size(); i++)
Z
zchen0211 已提交
67 68 69 70
    PADDLE_ENFORCE(src_dims[i] == dst_dims[i]);

  // slice size
  size_t slice_size = 1;
Z
zchen0211 已提交
71
  for (int i = 1; i < src_dims.size(); ++i) slice_size *= src_dims[i];
Z
zchen0211 已提交
72

Z
zchen0211 已提交
73
  CPUScatterAssign<T>(p_src, p_index, slice_size, index_size, p_output);
Z
zchen0211 已提交
74 75 76 77
}

}  // namespace operators
}  // namespace paddle