From 6be0ee159e508b1e5c418bfc47b7964cf77b337d Mon Sep 17 00:00:00 2001
From: Aurelius84
Date: Mon, 8 Jun 2020 12:23:34 +0800
Subject: [PATCH] Support LoDTensorArray in reverse_op (#24797)

* Support LoDTensorArray in reverse_op test=develop

* polish en doc and unittest code test=develop

* refine sample code test=develop

* add example of LoDTensorArray test=develop

* fix typo test=develop
---
 paddle/fluid/operators/reverse_op.cc          | 44 +++++++++---
 paddle/fluid/operators/reverse_op.h           | 22 +++++-
 python/paddle/fluid/layers/tensor.py          | 40 ++++++++++-
 .../fluid/tests/unittests/test_reverse_op.py  | 71 +++++++++++++++++++
 4 files changed, 165 insertions(+), 12 deletions(-)

diff --git a/paddle/fluid/operators/reverse_op.cc b/paddle/fluid/operators/reverse_op.cc
index 1f01841974..8b2b9f464b 100644
--- a/paddle/fluid/operators/reverse_op.cc
+++ b/paddle/fluid/operators/reverse_op.cc
@@ -24,14 +24,31 @@ class ReverseOp : public framework::OperatorWithKernel {
   using framework::OperatorWithKernel::OperatorWithKernel;
 
   void InferShape(framework::InferShapeContext* ctx) const override {
-    PADDLE_ENFORCE_EQ(
-        ctx->HasInput("X"), true,
-        platform::errors::InvalidArgument("Input(X) should not be null"));
-    PADDLE_ENFORCE_EQ(
-        ctx->HasOutput("Out"), true,
-        platform::errors::InvalidArgument("Output(Out) should not be null"));
-    const auto& x_dims = ctx->GetInputDim("X");
+    OP_INOUT_CHECK(ctx->HasInput("X"), "Input", "X", "Reverse");
+    OP_INOUT_CHECK(ctx->HasOutput("Out"), "Output", "Out", "Reverse");
+
+    auto x_var_type = ctx->GetInputsVarType("X")[0];
     const auto& axis = ctx->Attrs().Get<std::vector<int>>("axis");
+    if (x_var_type == framework::proto::VarType::LOD_TENSOR_ARRAY) {
+      PADDLE_ENFORCE_EQ(
+          axis.size(), 1,
+          platform::errors::InvalidArgument(
+              "The size of axis must be 1 when the Input(X) is LoDTensorArray, "
+              "but received %d.",
+              axis.size()));
+      PADDLE_ENFORCE_EQ(axis[0], 0, platform::errors::InvalidArgument(
+                                        "The value of axis should be 0 when "
+                                        "the Input(X) is LoDTensorArray, "
+                                        "but received %d.",
+                                        axis[0]));
+      // At runtime, the output shape is determined by RunImpl.
+      if (!ctx->IsRuntime()) {
+        const auto& x_dims = ctx->GetInputDim("X");
+        ctx->SetOutputDim("Out", x_dims);
+      }
+      return;
+    }
+    const auto& x_dims = ctx->GetInputDim("X");
     PADDLE_ENFORCE_NE(axis.empty(), true, platform::errors::InvalidArgument(
                                               "'axis' can not be empty."));
     for (int a : axis) {
@@ -51,6 +68,14 @@ class ReverseOp : public framework::OperatorWithKernel {
   }
 };
 
+class ReverseOpVarTypeInference : public framework::VarTypeInference {
+ public:
+  void operator()(framework::InferVarTypeContext* ctx) const override {
+    ctx->SetOutputType("Out", ctx->GetInputType("X"));
+    ctx->SetOutputDataType("Out", ctx->GetInputDataType("X"));
+  }
+};
+
 class ReverseOpMaker : public framework::OpProtoAndCheckerMaker {
  public:
   void Make() override {
@@ -111,8 +136,9 @@ class ReverseGradMaker : public framework::SingleGradOpMaker<T> {
 
 namespace ops = paddle::operators;
 REGISTER_OPERATOR(reverse, ops::ReverseOp, ops::ReverseOpMaker,
                   ops::ReverseGradMaker<paddle::framework::OpDesc>,
-                  ops::ReverseGradMaker<paddle::imperative::OpBase>);
-REGISTER_OPERATOR(reverse_grad, ops::ReverseOp);
+                  ops::ReverseGradMaker<paddle::imperative::OpBase>,
+                  ops::ReverseOpVarTypeInference);
+REGISTER_OPERATOR(reverse_grad, ops::ReverseOp, ops::ReverseOpVarTypeInference);
 REGISTER_OP_CPU_KERNEL(
     reverse, ops::ReverseKernel<paddle::platform::CPUDeviceContext, int>,
     ops::ReverseKernel<paddle::platform::CPUDeviceContext, uint8_t>,
diff --git a/paddle/fluid/operators/reverse_op.h b/paddle/fluid/operators/reverse_op.h
index 24489e618d..2813f7a486 100644
--- a/paddle/fluid/operators/reverse_op.h
+++ b/paddle/fluid/operators/reverse_op.h
@@ -47,10 +47,30 @@ template <typename DeviceContext, typename T>
 class ReverseKernel : public framework::OpKernel<T> {
  public:
  void Compute(const framework::ExecutionContext& context) const override {
+    auto* x_var = context.InputVar("X");
+    const auto& axis = context.Attr<std::vector<int>>("axis");
+    if (x_var->IsType<framework::LoDTensorArray>()) {
+      auto& x_array = x_var->Get<framework::LoDTensorArray>();
+      auto* out_array = context.Output<framework::LoDTensorArray>("Out");
+
+      out_array->resize(x_array.size());
+      for (size_t offset = 0; offset < x_array.size(); offset++) {
+        auto& x_tensor = x_array.at(offset);
+        PADDLE_ENFORCE_GT(
+            x_tensor.memory_size(), 0,
+            platform::errors::PreconditionNotMet(
+                "The input LoDTensorArray X[%d] holds no memory.", offset));
+        auto out_offset = x_array.size() - offset - 1;
+        auto* out_tensor = &out_array->at(out_offset);
+
+        out_tensor->set_lod(x_tensor.lod());
+        TensorCopy(x_tensor, context.GetPlace(), out_tensor);
+      }
+      return;
+    }
     auto* x = context.Input<framework::LoDTensor>("X");
     auto* out = context.Output<framework::LoDTensor>("Out");
     out->mutable_data<T>(context.GetPlace());
-    const auto& axis = context.Attr<std::vector<int>>("axis");
     int rank = x->dims().size();
     auto& dev_ctx = context.template device_context<DeviceContext>();
diff --git a/python/paddle/fluid/layers/tensor.py b/python/paddle/fluid/layers/tensor.py
index e81af19b6f..a7f10584b7 100644
--- a/python/paddle/fluid/layers/tensor.py
+++ b/python/paddle/fluid/layers/tensor.py
@@ -1094,11 +1094,37 @@ def reverse(x, axis):
     The OP reverses the tensor :attr:`x` along the given :attr:`axis`.
 
+    .. code-block:: text
+
+        Case 1:
+
+            Given a LoDTensor:
+                x = [[0, 1, 2], [3, 4, 5], [6, 7, 8]]
+                axis = [0, 1]
+
+            Then:
+                output = [[8, 7, 6], [5, 4, 3], [2, 1, 0]]
+
+        Case 2:
+
+            Given a LoDTensorArray:
+                x = {[[0, 1], [2, 3]],
+                     [[4, 5, 6]],
+                     [[7], [8], [9]]}
+                axis = 0
+
+            Then:
+                output = {[[7], [8], [9]],
+                          [[4, 5, 6]],
+                          [[0, 1], [2, 3]]}
+
     Parameters:
-        x (Variable): A tensor to be reversed, its data type supports bool, float32, float64, int32, int64 and uint8.
+        x (Variable): A tensor or LoDTensorArray to be reversed. Its data type supports bool, float32, float64, int32, int64 and uint8.
+            If input is a LoDTensorArray, a new reversed LoDTensorArray will be returned without changing the internal order of each inner tensor.
         axis (int|tuple|list): A dimension or a set of dimensions of :attr:`x` to reverse. Must be in
             the range [-rank( :attr:`x` ), rank( :attr:`x` )). If it is a tuple or a list, reversing
-            will be apply on each axis in the tuple or list.
+            will be applied to each axis in the tuple or list. If input is a LoDTensorArray, the value of axis must be 0, or a
+            list [0] or tuple (0, ) with shape [1].
 
     Returns:
         Variable: The reversed tensor with the same shape and data type as :attr:`x`.
 
@@ -1111,6 +1137,16 @@ def reverse(x, axis):
           data = fluid.layers.assign(np.array([[0, 1, 2], [3, 4, 5], [6, 7, 8]], dtype='float32')) # [[0., 1., 2.], [3., 4., 5.], [6., 7., 8.]]
           result1 = fluid.layers.reverse(data, 0) # [[6., 7., 8.], [3., 4., 5.], [0., 1., 2.]]
           result2 = fluid.layers.reverse(data, [0, 1]) # [[8., 7., 6.], [5., 4., 3.], [2., 1., 0.]]
+
+          # example of LoDTensorArray
+          data1 = fluid.layers.assign(np.array([[0, 1, 2]], dtype='float32'))
+          data2 = fluid.layers.assign(np.array([[3, 4, 5]], dtype='float32'))
+          tensor_array = fluid.layers.create_array(dtype='float32')
+          i = fluid.layers.fill_constant(shape=[1], dtype='int64', value=0)
+          fluid.layers.array_write(data1, i, tensor_array)
+          fluid.layers.array_write(data2, i + 1, tensor_array)
+
+          reversed_tensor_array = fluid.layers.reverse(tensor_array, 0) # {[[3, 4, 5]], [[0, 1, 2]]}
     """
     check_variable_and_dtype(
         x, 'x', ('float32', 'float64', 'int32', 'int64', 'uint8'), 'reverse')
diff --git a/python/paddle/fluid/tests/unittests/test_reverse_op.py b/python/paddle/fluid/tests/unittests/test_reverse_op.py
index 21d15b0571..5aaf0b85d5 100644
--- a/python/paddle/fluid/tests/unittests/test_reverse_op.py
+++ b/python/paddle/fluid/tests/unittests/test_reverse_op.py
@@ -110,5 +110,76 @@ class TestCase4(unittest.TestCase):
         self.assertRaises(core.EnforceNotMet, _run_program)
 
 
+class TestReverseLoDTensorArray(unittest.TestCase):
+    def setUp(self):
+        self.shapes = [[5, 25], [5, 20], [5, 5]]
+        self.place = fluid.CUDAPlace(0) if fluid.is_compiled_with_cuda(
+        ) else fluid.CPUPlace()
+        self.exe = fluid.Executor(self.place)
+
+    def run_program(self, arr_len, axis=0):
+        main_program = fluid.Program()
+
+        with fluid.program_guard(main_program):
+            inputs, inputs_data = [], []
+            for i in range(arr_len):
+                x = fluid.data("x%s" % i, self.shapes[i], dtype='float32')
+                x.stop_gradient = False
+                inputs.append(x)
+                inputs_data.append(
+                    np.random.random(self.shapes[i]).astype('float32'))
+
+            tensor_array = fluid.layers.create_array(dtype='float32')
+            for i in range(arr_len):
+                idx = fluid.layers.array_length(tensor_array)
+                fluid.layers.array_write(inputs[i], idx, tensor_array)
+
+            reverse_array = fluid.layers.reverse(tensor_array, axis=axis)
+            output, _ = fluid.layers.tensor_array_to_tensor(reverse_array)
+            loss = fluid.layers.reduce_sum(output)
+            fluid.backward.append_backward(loss)
+            input_grads = list(
+                map(main_program.global_block().var,
+                    [x.name + "@GRAD" for x in inputs]))
+
+            feed_dict = dict(zip([x.name for x in inputs], inputs_data))
+            res = self.exe.run(main_program,
+                               feed=feed_dict,
+                               fetch_list=input_grads + [output.name])
+
+        return np.hstack(inputs_data[::-1]), res
+
+    def test_case1(self):
+        gt, res = self.run_program(arr_len=3)
+        self.check_output(gt, res)
+        # test with tuple type of axis
+        gt, res = self.run_program(arr_len=3, axis=(0, ))
+        self.check_output(gt, res)
+
+    def test_case2(self):
+        gt, res = self.run_program(arr_len=1)
+        self.check_output(gt, res)
+        # test with list type of axis
+        gt, res = self.run_program(arr_len=1, axis=[0])
+        self.check_output(gt, res)
+
+    def check_output(self, gt, res):
+        arr_len = len(res) - 1
+        reversed_array = res[-1]
+        # check output
+        self.assertTrue(np.array_equal(gt, reversed_array))
+        # check grad
+        for i in range(arr_len):
+            self.assertTrue(np.array_equal(res[i], np.ones_like(res[i])))
+
+    def test_raise_error(self):
+        # The len(axis) should be 1 if input(X) is a LoDTensorArray.
+        with self.assertRaises(Exception):
+            self.run_program(arr_len=3, axis=[0, 1])
+        # The value of axis should be 0 if input(X) is a LoDTensorArray.
+        with self.assertRaises(Exception):
+            self.run_program(arr_len=3, axis=1)
+
+
 if __name__ == '__main__':
     unittest.main()
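
A minimal end-to-end sketch of the new LoDTensorArray path, assembled from the docstring example added in this patch. It assumes a Paddle build that already includes this change and uses the fluid 1.x static-graph API; the variable names are illustrative only.

    import numpy as np
    import paddle.fluid as fluid

    main_program = fluid.Program()
    with fluid.program_guard(main_program):
        # Write two tensors into a LoDTensorArray.
        data1 = fluid.layers.assign(np.array([[0, 1, 2]], dtype='float32'))
        data2 = fluid.layers.assign(np.array([[3, 4, 5]], dtype='float32'))
        tensor_array = fluid.layers.create_array(dtype='float32')
        i = fluid.layers.fill_constant(shape=[1], dtype='int64', value=0)
        fluid.layers.array_write(data1, i, tensor_array)
        fluid.layers.array_write(data2, i + 1, tensor_array)

        # Reverse the array order; axis must be 0 for a LoDTensorArray input.
        reversed_array = fluid.layers.reverse(tensor_array, 0)
        # Concatenate the reversed array back into one tensor so it can be fetched.
        output, _ = fluid.layers.tensor_array_to_tensor(reversed_array, axis=0)

    exe = fluid.Executor(fluid.CPUPlace())
    res = exe.run(main_program, fetch_list=[output])[0]
    print(res)  # expected: [[3., 4., 5.], [0., 1., 2.]]

Note that the kernel builds a new output array and copies each inner tensor via TensorCopy, so the input LoDTensorArray and the contents of its inner tensors are left untouched.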