/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License. */

#pragma once
#include "paddle/fluid/framework/eigen.h"
#include "paddle/fluid/framework/op_registry.h"
#include "paddle/fluid/operators/gather.h"
#include "paddle/fluid/operators/scatter.h"

namespace paddle {
namespace operators {

using Tensor = framework::Tensor;
template <typename T>
Y
Yu Yang 已提交
27
class ScatterOpKernel : public framework::OpKernel<T> {
Z
zchen0211 已提交
28 29
 public:
  void Compute(const framework::ExecutionContext &ctx) const override {
30 31 32
    PADDLE_ENFORCE_EQ(
        platform::is_cpu_place(ctx.GetPlace()), true,
        platform::errors::PreconditionNotMet("This kernel only runs on CPU."));
D
dzhwinter 已提交
33 34
    auto *X = ctx.Input<Tensor>("X");
    auto *Ids = ctx.Input<Tensor>("Ids");
Z
zchen0211 已提交
35 36
    auto *Updates = ctx.Input<Tensor>("Updates");
    auto *Out = ctx.Output<Tensor>("Out");
37
    double overwrite = ctx.Attr<bool>("overwrite");
Z
zchen0211 已提交
38

39
    // In place output: Out = X, Out[Ids] = Updates
40
    framework::TensorCopy(*X, ctx.GetPlace(), Out);
41
    // Apply ScatterUpdate: Out[index] = Updates[:]
42 43 44
    const auto &index_type = Ids->type();
    bool index_type_match = index_type == framework::proto::VarType::INT32 ||
                            index_type == framework::proto::VarType::INT64;
45 46 47 48 49 50 51 52 53
    PADDLE_ENFORCE_EQ(index_type_match, true,
                      platform::errors::InvalidArgument(
                          "Index holds the wrong type, it holds [%s],"
                          "but desires to be [%s] or [%s].",
                          paddle::framework::DataTypeToString(index_type),
                          paddle::framework::DataTypeToString(
                              framework::proto::VarType::INT32),
                          paddle::framework::DataTypeToString(
                              framework::proto::VarType::INT64)));
54 55 56 57 58 59 60 61 62 63 64 65 66
    if (overwrite) {
      if (index_type == framework::proto::VarType::INT32) {
        ScatterAssign<T, int32_t>(ctx.device_context(), *Updates, *Ids, Out);
      } else {
        ScatterAssign<T, int64_t>(ctx.device_context(), *Updates, *Ids, Out);
      }
    } else {
      if (index_type == framework::proto::VarType::INT32) {
        ScatterAssignAdd<T, int32_t>(ctx, *Updates, *Ids, Out);
      } else {
        ScatterAssignAdd<T, int64_t>(ctx, *Updates, *Ids, Out);
      }
    }
Z
zchen0211 已提交
67 68 69
  }
};
template <typename T>
Y
Yu Yang 已提交
71
class ScatterGradientOpKernel : public framework::OpKernel<T> {
Z
zchen0211 已提交
72 73
 public:
  void Compute(const framework::ExecutionContext &ctx) const override {
74 75 76
    PADDLE_ENFORCE_EQ(
        platform::is_cpu_place(ctx.GetPlace()), true,
        platform::errors::PreconditionNotMet("This kernel only runs on CPU."));
D
dzhwinter 已提交
77
    auto *dX = ctx.Output<Tensor>(framework::GradVarName("X"));
Z
zchen0211 已提交
78
    auto *dUpdates = ctx.Output<Tensor>(framework::GradVarName("Updates"));
D
dzhwinter 已提交
79
    auto *Ids = ctx.Input<Tensor>("Ids");
Z
zchen0211 已提交
80
    auto *dOut = ctx.Input<Tensor>(framework::GradVarName("Out"));
Z
zchen0211 已提交
81

C
chengduo 已提交
82 83
    if (dX) {
      // In place gradient: dX = dO
84
      framework::TensorCopy(*dOut, ctx.GetPlace(), dX);
C
chengduo 已提交
85 86 87 88
    }
    if (dUpdates) {
      dUpdates->mutable_data<T>(ctx.GetPlace());
      // Gradient by Gather: dUpdates = dO[Ids]
89 90 91 92 93
      const auto &index_type = Ids->type();
      bool index_type_match = index_type == framework::proto::VarType::INT32 ||
                              index_type == framework::proto::VarType::INT64;
      PADDLE_ENFORCE_EQ(
          index_type_match, true,
94 95 96 97 98 99 100 101
          platform::errors::InvalidArgument(
              "scatter_op index holds the wrong type, it holds [%s],"
              "but desires to be [%s] or [%s]",
              paddle::framework::DataTypeToString(index_type),
              paddle::framework::DataTypeToString(
                  framework::proto::VarType::INT32),
              paddle::framework::DataTypeToString(
                  framework::proto::VarType::INT64)));
102 103 104 105 106
      if (index_type == framework::proto::VarType::INT32) {
        CPUGather<T, int32_t>(ctx.device_context(), *dOut, *Ids, dUpdates);
      } else {
        CPUGather<T, int64_t>(ctx.device_context(), *dOut, *Ids, dUpdates);
      }
C
chengduo 已提交
107
    }
Z
zchen0211 已提交
108 109 110 111 112
  }
};

}  // namespace operators
}  // namespace paddle