From f5f9249a161f5fadf47bd0a629780088b60ffecf Mon Sep 17 00:00:00 2001
From: Megvii Engine Team <megengine@megvii.com>
Date: Mon, 28 Feb 2022 13:57:07 +0800
Subject: [PATCH] docs(compose): update compose API docstring and example

GitOrigin-RevId: fd52df2c48d50749714ea909f0b53440c7965fca
---
 .../data/transform/vision/transform.py        | 84 +++++++++++++------
 1 file changed, 58 insertions(+), 26 deletions(-)

diff --git a/imperative/python/megengine/data/transform/vision/transform.py b/imperative/python/megengine/data/transform/vision/transform.py
index 2af7bfce7..ed2e6f9b1 100644
--- a/imperative/python/megengine/data/transform/vision/transform.py
+++ b/imperative/python/megengine/data/transform/vision/transform.py
@@ -8,7 +8,7 @@
 # "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 import collections.abc
 import math
-from typing import Sequence, Tuple
+from typing import List, Sequence, Tuple
 
 import cv2
 import numpy as np
@@ -52,7 +52,7 @@ class VisionTransform(Transform):
             order is used to specify the order of structures. For example, if your input
             is (image, boxes) type, then the ``order`` should be ("image", "boxes").
             Current available strings and data type are describe below:
-    
+
             * "image": input image, with shape of `(H, W, C)`.
             * "coords": coordinates, with shape of `(N, 2)`.
             * "boxes": bounding boxes, with shape of `(N, 4)`, "xyxy" format,
@@ -69,7 +69,7 @@ class VisionTransform(Transform):
               means category of the input image and "boxes_category" means categories of
               bounding boxes.
             * "info": information for images such as image shapes and image path.
-    
+
     You can also customize your data types only if you implement the corresponding
     _apply_*() methods, otherwise ``NotImplementedError`` will be raised.
     """
@@ -183,35 +183,67 @@ class ToMode(VisionTransform):
 
 
 class Compose(VisionTransform):
-    r"""Composes several transforms together.
+    r"""Composes several transfomations together.
 
     Args:
         transforms: list of :class:`VisionTransform` to compose.
-        batch_compose: whether use shuffle_indices for batch data or not.
-            If True, use original input sequence.
-            Otherwise, the shuffle_indices will be used for transforms.
+        batch_compose: whether keep the same transform order in batch data when shuffle.
         shuffle_indices: indices used for random shuffle, start at 1.
-            For example, if shuffle_indices is [(1, 3), (2, 4)], then the 1st and 3rd transform
-            will be random shuffled, the 2nd and 4th transform will also be shuffled.
         order: the same with :class:`VisionTransform`
-    
+
+    .. seealso:: Refer to :mod:`~.data.transform` module for vision transform APIs.
+
     Examples:
-        .. testcode::
-        
-           from megengine.data.transform import RandomHorizontalFlip, RandomVerticalFlip, CenterCrop, ToMode, Compose
-           
-           transform_func = Compose([
-           RandomHorizontalFlip(),
-           RandomVerticalFlip(),
-           CenterCrop(100),
-           ToMode("CHW"),
-           ],
-           shuffle_indices=[(1, 2, 3)]
-           )
+
+        >>> import megengine.data.transform as T
+        >>> T.Compose([  # doctest: +SKIP
+        ...     T.RandomHorizontalFlip(),  # 1st
+        ...     T.RandomVerticalFlip(),    # 2nd
+        ...     T.CenterCrop(100),         # 3rd
+        ...     T.ToMode("CHW"),           # 4th
+        ...     ],
+        ...     shuffle_indices=[(1, 2, 3)]
+        ... )
+
+        In this case, ``shuffle_indices`` is given so each input data will be transformed
+        out of order:
+
+        .. math::
+
+           \begin{array}{cc}
+           [{\color{red}1 \quad 2 \quad 3} \quad 4] & [{\color{red}1 \quad 3 \quad 2} \quad 4] \\
+           [{\color{red}2 \quad 1 \quad 3} \quad 4] & [{\color{red}2 \quad 3 \quad 1} \quad 4] \\
+           [{\color{red}3 \quad 1 \quad 2} \quad 4] & [{\color{red}3 \quad 2 \quad 1} \quad 4]
+           \end{array}
+
+        In another case, if ``[(1, 3), (2, 4)]`` is given, then the 1st and 3rd transfomation
+        will be random shuffled, the 2nd and 4th transfomation will also be shuffled:
+
+        .. math::
+
+           \begin{array}{cc}
+           [{\color{red}1} \quad {\color{blue}2} \quad {\color{red}3} \quad {\color{blue}4}] &
+           [{\color{red}1} \quad {\color{blue}4} \quad {\color{red}3} \quad {\color{blue}2}] \\
+           [{\color{red}3} \quad {\color{blue}2} \quad {\color{red}1} \quad {\color{blue}4}] &
+           [{\color{red}3} \quad {\color{blue}4} \quad {\color{red}1} \quad {\color{blue}2}]
+           \end{array}
+
+        Different colors represent different groups that need to be internally shuffled.
+
+        .. warning::
+
+           Different samples within each batch will also use random transfomation orders,
+           unless ``batch_compose`` is set to ``True``.
+
     """
 
     def __init__(
-        self, transforms=[], batch_compose=False, shuffle_indices=None, *, order=None
+        self,
+        transforms: List[VisionTransform] = [],
+        batch_compose: bool = False,
+        shuffle_indices: List[Tuple] = None,
+        *,
+        order=None
     ):
         super().__init__(order)
         self.transforms = transforms
@@ -354,7 +386,7 @@ class Resize(VisionTransform):
     Args:
         output_size: target size of image, with (height, width) shape.
         interpolation: interpolation method. All methods are listed below:
-    
+
             * cv2.INTER_NEAREST – a nearest-neighbor interpolation.
             * cv2.INTER_LINEAR – a bilinear interpolation (used by default).
             * cv2.INTER_AREA – resampling using pixel area relation.
@@ -1012,9 +1044,9 @@ class ColorJitter(VisionTransform):
 
 class Lighting(VisionTransform):
     r"""Apply AlexNet-Style "lighting" augmentation to input data.
-    
+
     Input images are assumed to have 'RGB' channel order.
-    
+
     The degree of color jittering is randomly sampled via a normal distribution,
     with standard deviation given by the scale parameter.
     """
-- 
GitLab