Merge pull request #5499 from reyoung/feature/increase_cpu

Feature/increase cpu

Merge pull request #5499 from reyoung/feature/increase_cpu
Feature/increase cpu
133f8903 · Yu Yang · GitHub · 78fb29bb · 9c10db36 · 133f8903
7 changed file
--- a/paddle/framework/backward.cc
+++ b/paddle/framework/backward.cc
@@ -408,6 +408,11 @@ std::vector<std::unique_ptr<OpDescBind>> MakeBlockBackward(
    for (const auto& desc : op_grads) {
      for (const std::string& out_name : desc->OutputArgumentNames()) {
+        if (out_name.find("@GRAD") == std::string::npos) {
+          // Not all outputs of a backward operator is a gradient. Only gradient
+          // need to be sum. Skip variables are not gradient.
+          continue;
+        }
        dup_out_ops[out_name].emplace_back(grad_desc_idx);
      }
      ++grad_desc_idx;

--- a/paddle/operators/increment_op.cc
+++ b/paddle/operators/increment_op.cc
@@ -12,22 +12,57 @@
   See the License for the specific language governing permissions and
   limitations under the License. */
-#include "paddle/operators/increment_op.h"
+#include "paddle/framework/op_registry.h"
 namespace paddle {
 namespace operators {
-class IncrementOp : public framework::OperatorWithKernel {
+class IncrementInferShape : public framework::InferShapeBase {
 public:
-  using framework::OperatorWithKernel::OperatorWithKernel;
+  void operator()(framework::InferShapeContext *ctx) const override {
-  void InferShape(framework::InferShapeContext *ctx) const override {
    PADDLE_ENFORCE(ctx->HasInput("X"),
                   "Input(X) of IncrementOp should not be null.");
    PADDLE_ENFORCE(ctx->HasOutput("Out"),
                   "Output(Out) of IncrementOp should not be null.");
+    PADDLE_ENFORCE_EQ(1, framework::product(ctx->GetInputDim("X")));
    ctx->SetOutputDim("Out", ctx->GetInputDim("X"));
-    ctx->ShareLoD("X", /*->*/ "Out");
+  }
+};
+struct IncrementFunctor {
+  IncrementFunctor(const framework::LoDTensor &x, framework::LoDTensor *out,
+                   float value)
+      : x_(x), out_(out), value_(value) {}
+  template <typename T>
+  void operator()() const {
+    *out_->data<T>() = *x_.data<T>() + static_cast<T>(value_);
+  }
+  const framework::LoDTensor &x_;
+  framework::LoDTensor *out_;
+  float value_;
+};
+class IncrementOp : public framework::OperatorBase {
+ public:
+  IncrementOp(const std::string &type, const framework::VariableNameMap &inputs,
+              const framework::VariableNameMap &outputs,
+              const framework::AttributeMap &attrs)
+      : OperatorBase(type, inputs, outputs, attrs) {}
+  void Run(const framework::Scope &scope,
+           const platform::DeviceContext &dev_ctx) const override {
+    auto &x = scope.FindVar(Input("X"))->Get<framework::LoDTensor>();
+    auto &out =
+        *scope.FindVar(Output("Out"))->GetMutable<framework::LoDTensor>();
+    PADDLE_ENFORCE(platform::is_cpu_place(x.place()));
+    out.Resize(x.dims());
+    out.mutable_data(x.place(), x.type());
+    float value = Attr<float>("step");
+    framework::VisitDataType(framework::ToDataType(out.type()),
+                             IncrementFunctor(x, &out, value));
  }
 };
@@ -59,10 +94,10 @@ class IncrementGradOpMaker : public framework::SingleGradOpDescMaker {
  std::unique_ptr<framework::OpDescBind> Apply() const override {
    auto *grad_op = new framework::OpDescBind();
-    grad_op->SetType("scale");
+    grad_op->SetType("increment");
-    grad_op->SetInput("X", OutputGrad("Out"));
+    grad_op->SetInput("X", Output("Out"));
-    grad_op->SetOutput("Out", InputGrad("X"));
+    grad_op->SetOutput("Out", Input("X"));
-    grad_op->SetAttr("scale", 1.0f);
+    grad_op->SetAttr("step", -boost::get<float>(GetAttr("step")));
    return std::unique_ptr<framework::OpDescBind>(grad_op);
  }
 };
@@ -71,11 +106,5 @@ class IncrementGradOpMaker : public framework::SingleGradOpDescMaker {
 }  // namespace paddle
 namespace ops = paddle::operators;
+REGISTER_OPERATOR(increment, ops::IncrementOp, ops::IncrementInferShape,
-REGISTER_OPERATOR(increment, ops::IncrementOp, ops::IncrementOpMaker,
+                  ops::IncrementOpMaker, ops::IncrementGradOpMaker);
-                  ops::IncrementGradOpMaker);
-REGISTER_OP_CPU_KERNEL(
-    increment, ops::IncrementKernel<paddle::platform::CPUPlace, float>,
-    ops::IncrementKernel<paddle::platform::CPUPlace, double>,
-    ops::IncrementKernel<paddle::platform::CPUPlace, int>,
-    ops::IncrementKernel<paddle::platform::CPUPlace, int64_t>);
--- a/paddle/operators/increment_op.cu
+++ b/paddle/operators/increment_op.cu
-/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-   http://www.apache.org/licenses/LICENSE-2.0
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License. */
-#include "paddle/operators/increment_op.h"
-REGISTER_OP_GPU_KERNEL(
-    increment,
-    paddle::operators::IncrementKernel<paddle::platform::GPUPlace, float>,
-    paddle::operators::IncrementKernel<paddle::platform::GPUPlace, double>,
-    paddle::operators::IncrementKernel<paddle::platform::GPUPlace, int>,
-    paddle::operators::IncrementKernel<paddle::platform::GPUPlace, int64_t>);
--- a/paddle/operators/increment_op.h
+++ b/paddle/operators/increment_op.h
-/* Copyright (c) 2016 PaddlePaddle Authors. All Rights Reserve.
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-   http://www.apache.org/licenses/LICENSE-2.0
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License. */
-#pragma once
-#include "paddle/framework/eigen.h"
-#include "paddle/framework/op_registry.h"
-namespace paddle {
-namespace operators {
-template <typename Place, typename T>
-class IncrementKernel : public framework::OpKernel<T> {
- public:
-  virtual void Compute(const framework::ExecutionContext& context) const {
-    auto* tensor = context.Output<framework::Tensor>("Out");
-    auto* in = context.Input<framework::Tensor>("X");
-    tensor->mutable_data<T>(in->place());
-    auto step = static_cast<T>(context.Attr<float>("step"));
-    auto eigen_out = framework::EigenVector<T>::Flatten(*tensor);
-    auto eigen_in = framework::EigenVector<T>::Flatten(*in);
-    auto& place = context.GetEigenDevice<Place>();
-    eigen_out.device(place) = eigen_in + step;
-  }
-};
-}  // namespace operators
-}  // namespace paddle
--- a/python/paddle/v2/framework/layers.py
+++ b/python/paddle/v2/framework/layers.py
@@ -872,7 +872,7 @@ def array_to_lod_tensor(x, table, main_program=None):
 def fill_constant(shape, dtype, value, main_program=None):
-    helper = LayerHelper("ones", **locals())
+    helper = LayerHelper("fill_constant", **locals())
    out = helper.create_tmp_variable(dtype=dtype)
    helper.append_op(
        type='fill_constant',
@@ -895,9 +895,12 @@ def zeros(shape, dtype, main_program=None):
    return fill_constant(value=0.0, **locals())
-def increment(x, value=1.0, main_program=None):
+def increment(x, value=1.0, in_place=True, main_program=None):
    helper = LayerHelper("increment", **locals())
-    out = helper.create_tmp_variable(dtype=x.data_type)
+    if in_place:
+        out = x
+    else:
+        out = helper.create_tmp_variable(dtype=x.data_type)
    helper.append_op(
        type='increment',
        inputs={'X': [x]},

--- a/python/paddle/v2/framework/tests/test_array_read_write_op.py
+++ b/python/paddle/v2/framework/tests/test_array_read_write_op.py
@@ -20,21 +20,19 @@ class TestArrayReadWrite(unittest.TestCase):
            each_x.stop_gradient = False
        i = layers.zeros(shape=[1], dtype='int64')
+        i.stop_gradient = False
        arr = layers.array_write(x=x[0], i=i)
        i = layers.increment(x=i)
-        i.stop_gradient = True
        arr = layers.array_write(x=x[1], i=i, array=arr)
        i = layers.increment(x=i)
-        i.stop_gradient = True
        arr = layers.array_write(x=x[2], i=i, array=arr)
        i = layers.zeros(shape=[1], dtype='int64')
+        i.stop_gradient = False
        a0 = layers.array_read(array=arr, i=i)
        i = layers.increment(x=i)
-        i.stop_gradient = True  # index should not calculate gradient
        a1 = layers.array_read(array=arr, i=i)
        i = layers.increment(x=i)
-        i.stop_gradient = True
        a2 = layers.array_read(array=arr, i=i)
        mean_a0 = layers.mean(x=a0)

--- a/python/paddle/v2/framework/tests/test_increment_op.py
+++ b/python/paddle/v2/framework/tests/test_increment_op.py
-import unittest
-import numpy as np
-from op_test import OpTest
-class TestIncrementOpPositiveStep(OpTest):
-    """Test increment op with positive step
-    """
-    def setUp(self):
-        self.op_type = "increment"
-        self.inputs = {'X': np.random.random((10, 10)).astype("float32")}
-        self.attrs = {'step': 14.8}
-        self.outputs = {'Out': self.inputs['X'] + self.attrs['step']}
-    def test_check_output(self):
-        self.check_output()
-    def test_check_grad(self):
-        self.check_grad(['X'], 'Out')
-class TestIncrementOpNegativeStep(OpTest):
-    """Test increment op with negative step
-    """
-    def setUp(self):
-        self.op_type = "increment"
-        self.inputs = {'X': np.random.random((10, 10)).astype("float32")}
-        self.attrs = {'step': -3.8}
-        self.outputs = {'Out': self.inputs['X'] + self.attrs['step']}
-    def test_check_output(self):
-        self.check_output()
-    def test_check_grad(self):
-        self.check_grad(['X'], 'Out')
-if __name__ == "__main__":
-    unittest.main()