Commit 2cdc9036 authored by linjintao

Add docstring for FP16 part

Parent 7adb6410
@@ -19,21 +19,23 @@ def auto_fp16(apply_to=None, out_fp32=False):
`None` indicates all arguments.
out_fp32 (bool): Whether to convert the output back to fp32.
:Example:
class MyModule1(nn.Module)
# Convert x and y to fp16
@auto_fp16()
def forward(self, x, y):
pass
class MyModule2(nn.Module):
# convert pred to fp16
@auto_fp16(apply_to=('pred', ))
def do_something(self, pred, others):
pass
Example:
>>> import torch.nn as nn
>>> class MyModule1(nn.Module):
>>>
>>> # Convert x and y to fp16
>>> @auto_fp16()
>>> def forward(self, x, y):
>>> pass
>>> import torch.nn as nn
>>> class MyModule2(nn.Module):
>>>
>>> # convert pred to fp16
>>> @auto_fp16(apply_to=('pred', ))
>>> def do_something(self, pred, others):
>>> pass
"""
def auto_fp16_wrapper(old_func):
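For readers skimming the diff, here is a heavily simplified sketch of what a decorator like this has to do: cast floating-point tensor arguments to fp16 and optionally cast the result back to fp32. It ignores apply_to for brevity and is an illustrative stand-in, not the library's actual implementation.

import functools
import torch

def auto_fp16_sketch(out_fp32=False):
    # Simplified stand-in: casts every floating-point tensor argument to fp16.
    def wrapper(old_func):
        @functools.wraps(old_func)
        def new_func(self, *args, **kwargs):
            def to_half(x):
                if isinstance(x, torch.Tensor) and x.is_floating_point():
                    return x.half()
                return x
            args = tuple(to_half(a) for a in args)
            kwargs = {k: to_half(v) for k, v in kwargs.items()}
            output = old_func(self, *args, **kwargs)
            if out_fp32 and isinstance(output, torch.Tensor):
                output = output.float()
            return output
        return new_func
    return wrapper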
@@ -97,21 +99,23 @@ def force_fp32(apply_to=None, out_fp16=False):
`None` indicates all arguments.
out_fp16 (bool): Whether to convert the output back to fp16.
:Example:
class MyModule1(nn.Module)
# Convert x and y to fp32
@force_fp32()
def loss(self, x, y):
pass
class MyModule2(nn.Module):
# convert pred to fp32
@force_fp32(apply_to=('pred', ))
def post_process(self, pred, others):
pass
Example:
>>> import torch.nn as nn
>>> class MyModule1(nn.Module):
>>>
>>> # Convert x and y to fp32
>>> @force_fp32()
>>> def loss(self, x, y):
>>> pass
>>> import torch.nn as nn
>>> class MyModule2(nn.Module):
>>>
>>> # convert pred to fp32
>>> @force_fp32(apply_to=('pred', ))
>>> def post_process(self, pred, others):
>>> pass
"""
def force_fp32_wrapper(old_func):
......
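A short usage sketch of how the two decorators from this file are typically combined in one module, following the pattern in the docstrings above: forward runs in fp16 while the numerically sensitive loss is computed in fp32. The class and method bodies are made up for illustration, and auto_fp16 / force_fp32 are assumed to be in scope.

import torch.nn as nn
import torch.nn.functional as F

class ToyHead(nn.Module):
    # Hypothetical module: forward runs in fp16, loss is computed in fp32.

    @auto_fp16()
    def forward(self, x):
        return x * 2

    @force_fp32(apply_to=('pred', ))
    def loss(self, pred, target):
        return F.mse_loss(pred, target)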
@@ -38,6 +38,11 @@ class Fp16OptimizerHook(OptimizerHook):
self.distributed = distributed
def before_run(self, runner):
"""Preparing steps before Mixed Precision Training.
1. Make a master copy of fp32 weights for optimization.
2. Convert the main model from fp32 to fp16.
"""
# keep a copy of fp32 weights
runner.optimizer.param_groups = copy.deepcopy(
runner.optimizer.param_groups)
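A minimal sketch of the two documented steps together. The hunk is truncated after step 1, so the wrap_fp16_model call for step 2 is inferred from the docstring (wrap_fp16_model is the helper defined later in this diff and is assumed to be in scope).

import copy

def before_run_sketch(runner):
    # 1. Deep-copy the optimizer's param_groups so the optimizer keeps
    #    updating fp32 master weights even after the model is halved.
    runner.optimizer.param_groups = copy.deepcopy(
        runner.optimizer.param_groups)
    # 2. Convert the model itself to fp16; wrap_fp16_model keeps
    #    normalization layers in fp32.
    wrap_fp16_model(runner.model)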
@@ -58,6 +63,14 @@ class Fp16OptimizerHook(OptimizerHook):
fp16_param.data.copy_(fp32_param.data)
def after_train_iter(self, runner):
"""Backward optimization steps for Mixed Precision Training.
1. Scale the loss by a scale factor.
2. Backward the loss to obtain the gradients (fp16).
3. Copy gradients from the model to the fp32 weight copy.
4. Scale the gradients back and update the fp32 weight copy.
5. Copy back the params from fp32 weight copy to the fp16 model.
"""
# clear grads of last iteration
runner.model.zero_grad()
runner.optimizer.zero_grad()
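The five numbered steps above map naturally onto code. Below is a hedged, standalone sketch that assumes the hook stores a loss_scale value, that runner.outputs['loss'] holds the current loss (the OptimizerHook convention), and that the optimizer's param_groups line up one-to-one with the model's parameters; the real hook also handles distributed training and edge cases not shown here.

import torch

def after_train_iter_sketch(runner, loss_scale=512.0):
    # clear grads of the last iteration
    runner.model.zero_grad()
    runner.optimizer.zero_grad()
    # 1. Scale the loss so that small fp16 gradients do not underflow.
    scaled_loss = runner.outputs['loss'] * loss_scale
    # 2. Backward pass produces fp16 gradients in the model.
    scaled_loss.backward()
    # 3. Copy gradients from the fp16 model to the fp32 master weights
    #    (one-to-one parameter ordering is assumed).
    fp32_weights = [p for group in runner.optimizer.param_groups
                    for p in group['params']]
    fp16_params = list(runner.model.parameters())
    for fp32_p, fp16_p in zip(fp32_weights, fp16_params):
        if fp16_p.grad is not None:
            if fp32_p.grad is None:
                fp32_p.grad = torch.zeros_like(fp32_p.data)
            fp32_p.grad.copy_(fp16_p.grad)
    # 4. Un-scale the gradients and update the fp32 master copy.
    for p in fp32_weights:
        if p.grad is not None:
            p.grad.div_(loss_scale)
    runner.optimizer.step()
    # 5. Copy the updated fp32 weights back into the fp16 model.
    for fp32_p, fp16_p in zip(fp32_weights, fp16_params):
        fp16_p.data.copy_(fp32_p.data)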
@@ -85,6 +98,14 @@ class Fp16OptimizerHook(OptimizerHook):
def wrap_fp16_model(model):
"""Wrap the FP32 model to FP16.
1. Convert FP32 model to FP16.
2. Keep some necessary layers in FP32, e.g., normalization layers.
Args:
model (nn.Module): Model in FP32.
"""
# convert model to fp16
model.half()
# patch the normalization layers to make it work in fp32 mode
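A short usage example of the helper above; the model is a stand-in, and the dtype observations follow directly from model.half() plus the normalization-layer patching described in this hunk (wrap_fp16_model is assumed to be in scope).

import torch.nn as nn

model = nn.Sequential(nn.Conv2d(3, 8, 3), nn.BatchNorm2d(8), nn.ReLU())
wrap_fp16_model(model)
print(model[0].weight.dtype)  # torch.float16 -- conv weights were halved
print(model[1].weight.dtype)  # torch.float32 -- BatchNorm patched back to fp32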
@@ -96,6 +117,15 @@ def wrap_fp16_model(model):
def patch_norm_fp32(module):
"""Recursively convert normalization layers from FP16 to FP32.
Args:
module (nn.Module): The FP16 module whose normalization layers are to be converted to FP32.
Returns:
nn.Module: The converted module, whose normalization layers have been cast to FP32.
"""
if isinstance(module, (_BatchNorm, nn.GroupNorm)):
module.float()
module.forward = patch_forward_method(module.forward, torch.half,
......
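patch_forward_method is referenced above but truncated in this hunk. Here is a plausible sketch of what such a patch does, built on the cast_tensor_type helper from the last hunk of this diff; the signature and keyword argument are assumed, not taken from the source.

def patch_forward_method_sketch(func, src_type, dst_type, convert_output=True):
    # Assumed behavior: wrap `func` so tensor inputs in src_type are cast to
    # dst_type before the call, and outputs are cast back if requested.
    def new_forward(*args, **kwargs):
        output = func(*cast_tensor_type(args, src_type, dst_type),
                      **cast_tensor_type(kwargs, src_type, dst_type))
        if convert_output:
            output = cast_tensor_type(output, dst_type, src_type)
        return output
    return new_forward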
@@ -5,6 +5,16 @@ import torch
def cast_tensor_type(inputs, src_type, dst_type):
"""Recursively convert Tensor in inputs from src_type to dst_type.
Args:
inputs: Inputs to be cast.
src_type (torch.dtype): Source type.
dst_type (torch.dtype): Destination type.
Returns:
The same type as inputs, with all contained Tensors cast to dst_type.
"""
if isinstance(inputs, torch.Tensor):
return inputs.to(dst_type)
elif isinstance(inputs, str):
......
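A small usage illustration of the helper above, covering only the Tensor and str branches shown in this hunk; handling of containers is implied by the docstring but not visible here (cast_tensor_type is assumed to be in scope).

import torch

x = torch.randn(2, 3)
y = cast_tensor_type(x, torch.float32, torch.half)
print(y.dtype)  # torch.float16

# Strings pass through unchanged; per the docstring, containers are
# traversed recursively and only the contained Tensors are converted.
print(cast_tensor_type('img_meta', torch.float32, torch.half))  # 'img_meta'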