add doc

Signed-off-by: N lixuanyi <lixuanyi@sensetime.com>

add doc
Signed-off-by: N lixuanyi <lixuanyi@sensetime.com>
b42a5fad · lixuanyi · fc77dc36 · b42a5fad · b42a5fad
隐藏空白更改
内联并排

Showing with 65 addition and 2 deletion

mmaction/models/localizers/bmn.py mmaction/models/localizers/bmn.py +30 -2

mmaction/models/localizers/bsn.py mmaction/models/localizers/bsn.py +35 -0

未找到文件。
--- a/mmaction/models/localizers/bmn.py
+++ b/mmaction/models/localizers/bmn.py
@@ -131,6 +131,7 @@ class BMN(nn.Module):
        self.bm_mask = self._get_bm_mask()

    def _match_map(self):
+        """Generate match map."""
        temporal_gap = 1. / self.tscale
        match_map = []
        for idx in range(self.tscale):
@@ -146,6 +147,20 @@ class BMN(nn.Module):
        return match_map

    def _temporal_anchors(self, tmin_offset=0., tmax_offset=1.):
+        """Generate temporal anchors.
+
+        Args:
+            tmin_offset (int): Offset for the minimum value of temporal anchor.
+                Default: 0
+            tmax_offset (int): Offset for the maximun value of temporal anchor.
+                Default: 1
+
+        Returns:
+            anchors_tmins (Sequence[float]): The minimum values of temporal
+                anchors.
+            anchors_tmaxs (Sequence[float]): The maximum values of temporal
+                anchors.
+        """
        temporal_gap = 1. / self.tscale
        anchors_tmins = []
        anchors_tmaxs = []
@@ -156,6 +171,14 @@ class BMN(nn.Module):
        return anchors_tmins, anchors_tmaxs

    def _forward(self, x):
+        """Defines the computation performed at every call.
+
+        Args:
+            x (torch.Tensor): The input data.
+
+        Returns:
+            x (torch.Tensor): The output of the module.
+        """
        # x.shape [batch_size, self.feat_dim, self.tscale]
        base_feature = self.x_1d_b(x)
        # base_feature.shape [batch_size, self.hidden_dim_1d, self.tscale]
@@ -175,6 +198,7 @@ class BMN(nn.Module):
        return confidence_map, start, end

    def _boundary_matching_layer(self, x):
+        """Generate matching layer."""
        input_size = x.size()
        out = torch.matmul(x,
                           self.sample_mask).reshape(input_size[0],
@@ -184,6 +208,7 @@ class BMN(nn.Module):
        return out

    def forward_test(self, raw_feature, video_meta):
+        """Defines the computation performed at every call when testing."""
        confidence_map, start, end = self._forward(raw_feature)
        start_scores = start[0].cpu().numpy()
        end_scores = end[0].cpu().numpy()
@@ -245,6 +270,7 @@ class BMN(nn.Module):

    def forward_train(self, raw_feature, label_confidence, label_start,
                      label_end):
+        """Defines the computation performed at every call when training."""
        confidence_map, start, end = self._forward(raw_feature)
        loss = self.loss_cls(confidence_map, start, end, label_confidence,
                             label_start, label_end,
@@ -253,6 +279,7 @@ class BMN(nn.Module):
        return loss_dict

    def generate_labels(self, gt_bbox):
+        """Generate training labels."""
        match_score_confidence_list = []
        match_score_start_list = []
        match_score_end_list = []
@@ -320,7 +347,7 @@ class BMN(nn.Module):

    def _get_interp1d_bin_mask(self, seg_tmin, seg_tmax, tscale, num_samples,
                               num_samples_per_bin):
-        # generate sample mask for a boundary-matching pair
+        """Generate sample mask for a boundary-matching pair."""
        plen = float(seg_tmax - seg_tmin)
        plen_sample = plen / (num_samples * num_samples_per_bin - 1.0)
        total_samples = [
@@ -345,7 +372,7 @@ class BMN(nn.Module):
        return p_mask

    def _get_interp1d_mask(self):
-        # generate sample mask for each point in Boundary-Matching Map
+        """Generate sample mask for each point in Boundary-Matching Map."""
        mask_mat = []
        for start_index in range(self.tscale):
            mask_mat_vector = []
@@ -370,6 +397,7 @@ class BMN(nn.Module):
            torch.tensor(mask_mat).view(self.tscale, -1), requires_grad=False)

    def _get_bm_mask(self):
+        """Generate Boundary-Matching Mask."""
        bm_mask = []
        for idx in range(self.tscale):
            mask_vector = [1] * (self.tscale - idx) + [0] * idx

--- a/mmaction/models/localizers/bsn.py
+++ b/mmaction/models/localizers/bsn.py
@@ -77,6 +77,20 @@ class TEM(nn.Module):
        self.anchors_tmins, self.anchors_tmaxs = self._temporal_anchors()

    def _temporal_anchors(self, tmin_offset=0., tmax_offset=1.):
+        """Generate temporal anchors.
+
+        Args:
+            tmin_offset (int): Offset for the minimum value of temporal anchor.
+                Default: 0
+            tmax_offset (int): Offset for the maximun value of temporal anchor.
+                Default: 1
+
+        Returns:
+            anchors_tmins (Sequence[float]): The minimum values of temporal
+                anchors.
+            anchors_tmaxs (Sequence[float]): The maximum values of temporal
+                anchors.
+        """
        temporal_gap = 1. / self.temporal_dim
        anchors_tmins = []
        anchors_tmaxs = []
@@ -87,12 +101,21 @@ class TEM(nn.Module):
        return anchors_tmins, anchors_tmaxs

    def _forward(self, x):
+        """Defines the computation performed at every call.
+
+        Args:
+            x (torch.Tensor): The input data.
+
+        Returns:
+            x (torch.Tensor): The output of the module.
+        """
        x = F.relu(self.conv1_ratio * self.conv1(x))
        x = F.relu(self.conv2_ratio * self.conv2(x))
        x = torch.sigmoid(self.conv3_ratio * self.conv3(x))
        return x

    def forward_train(self, raw_feature, label_action, label_start, label_end):
+        """Defines the computation performed at every call when training."""
        tem_output = self._forward(raw_feature)
        score_action = tem_output[:, 0, :]
        score_start = tem_output[:, 1, :]
@@ -113,6 +136,7 @@ class TEM(nn.Module):
        return loss_dict

    def forward_test(self, raw_feature, video_meta):
+        """Defines the computation performed at every call when testing."""
        tem_output = self._forward(raw_feature).cpu().numpy()
        batch_action = tem_output[:, 0, :]
        batch_start = tem_output[:, 1, :]
@@ -133,6 +157,7 @@ class TEM(nn.Module):
        return video_results

    def generate_labels(self, gt_bbox):
+        """Generate training labels."""
        match_score_action_list = []
        match_score_start_list = []
        match_score_end_list = []
@@ -257,12 +282,21 @@ class PEM(nn.Module):
            bias=True)

    def _forward(self, x):
+        """Defines the computation performed at every call.
+
+        Args:
+            x (torch.Tensor): The input data.
+
+        Returns:
+            x (torch.Tensor): The output of the module.
+        """
        x = torch.cat([data for data in x])
        x = F.relu(self.fc1_ratio * self.fc1(x))
        x = torch.sigmoid(self.fc2_ratio * self.fc2(x))
        return x

    def forward_train(self, bsp_feature, reference_temporal_iou):
+        """Defines the computation performed at every call when training."""
        pem_output = self._forward(bsp_feature)
        reference_temporal_iou = torch.cat(
            [data for data in reference_temporal_iou])
@@ -307,6 +341,7 @@ class PEM(nn.Module):

    def forward_test(self, bsp_feature, tmin, tmax, tmin_score, tmax_score,
                     video_meta):
+        """Defines the computation performed at every call when testing."""
        pem_output = self._forward(bsp_feature).view(-1).cpu().numpy().reshape(
            -1, 1)