[AutoParallel] fix converter when sliced_shape is 1 (#41103)

* fix converter when sliced_shape is 1
* update unittest

[AutoParallel] fix converter when sliced_shape is 1 (#41103)
* fix converter when sliced_shape is 1
* update unittest
59c4fdac · zhaoyingli · GitHub · a0e961c0 · 59c4fdac · 59c4fdac
3 changed files
--- a/python/paddle/distributed/auto_parallel/converter.py
+++ b/python/paddle/distributed/auto_parallel/converter.py
@@ -447,8 +447,8 @@ class Converter(object):
                slice_shape = shape
            else:
                slice_shape = shape // process_shape[dims_mapping[i]]
-            if shape == 1:
+            if slice_shape == 1:
-                index = 0
+                index = partition_index[i][0]
            else:
                index = (partition_index[i][0] + 1) // slice_shape
            sliced_index = sliced_index * (shape // slice_shape) + index

--- a/python/paddle/distributed/auto_parallel/utils.py
+++ b/python/paddle/distributed/auto_parallel/utils.py
@@ -943,8 +943,8 @@ def _get_sliced_param_index(rank, complete_shape, dims_mapping, process_shape,
            slice_shape = shape
        else:
            slice_shape = shape // process_shape[dims_mapping[i]]
-        if shape == 1:
+        if slice_shape == 1:
-            index = 0
+            index = partition_index[i][0]
        else:
            index = (partition_index[i][0] + 1) // slice_shape
        sliced_param_index = sliced_param_index * (shape // slice_shape) + index

--- a/python/paddle/fluid/tests/unittests/auto_parallel/converter.py
+++ b/python/paddle/fluid/tests/unittests/auto_parallel/converter.py
@@ -78,6 +78,28 @@ def test_convert():
    convert_tensor_dict = converter.convert(strict=False)
    assert np.equal(convert_tensor_dict[new_name], tensor_row[rank_id]).all()
+    # test sliced_shape is 1
+    complete_tensor = np.arange(4).reshape([2, 2])
+    tensor_row = np.split(complete_tensor, 2, axis=0)
+    complet_strategy = {
+        "tensor_2": {
+            "process_shape": [2],
+            "process_group": [0, 1],
+            "dims_mapping": [-1, -1]
+        }
+    }
+    row_strategy = {
+        "tensor_2": {
+            "process_shape": [2],
+            "process_group": [0, 1],
+            "dims_mapping": [0, -1]
+        }
+    }
+    tensor_dict = {"tensor_2": [complete_tensor]}
+    converter = Converter(tensor_dict, complet_strategy, row_strategy)
+    convert_tensor_dict = converter.convert()
+    assert np.equal(convert_tensor_dict["tensor_2"], tensor_row[rank_id]).all()
 if __name__ == "__main__":
    test_convert()