# darknet.py
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import paddle
import paddle.nn as nn
import paddle.nn.functional as F
from paddle import ParamAttr
from paddle.regularizer import L2Decay
from ppdet.core.workspace import register, serializable
from ppdet.modeling.ops import batch_norm
from ..shape_spec import ShapeSpec

# Names exported by a star-import of this module.
__all__ = ['DarkNet', 'ConvBNLayer']


class ConvBNLayer(nn.Layer):
    """Bias-free 2D convolution, a normalization layer, and an optional
    leaky ReLU.

    Args:
        ch_in: Passed to ``nn.Conv2D`` as ``in_channels``.
        ch_out: Passed to ``nn.Conv2D`` as ``out_channels`` and to the
            ``batch_norm`` helper as its first argument.
        filter_size: Passed to ``nn.Conv2D`` as ``kernel_size``.
        stride: Forwarded to ``nn.Conv2D``.
        groups: Forwarded to ``nn.Conv2D``.
        padding: Forwarded to ``nn.Conv2D``.
        norm_type: Forwarded to the ``batch_norm`` helper.
        norm_decay: Forwarded to the ``batch_norm`` helper.
        act: When equal to ``'leaky'``, ``F.leaky_relu(out, 0.1)`` is applied
            after normalization; any other value leaves the normalized
            output untouched.
        name: Prefix for parameter names. The convolution weight is named
            ``name + '.conv.weights'``, so a string must be supplied; the
            default ``None`` fails on that concatenation.
        data_format: Forwarded to both ``nn.Conv2D`` and ``batch_norm``.
    """

    def __init__(self,
                 ch_in,
                 ch_out,
                 filter_size=3,
                 stride=1,
                 groups=1,
                 padding=0,
                 norm_type='bn',
                 norm_decay=0.,
                 act="leaky",
                 name=None,
                 data_format='NCHW'):
        super(ConvBNLayer, self).__init__()

        # The convolution carries no bias term (bias_attr=False); it is
        # immediately followed by the normalization layer below.
        self.conv = nn.Conv2D(
            in_channels=ch_in,
            out_channels=ch_out,
            kernel_size=filter_size,
            stride=stride,
            padding=padding,
            groups=groups,
            weight_attr=ParamAttr(name=name + '.conv.weights'),
            data_format=data_format,
            bias_attr=False)
        # The helper receives the un-suffixed prefix; how it derives its own
        # parameter names is decided inside ppdet.modeling.ops.batch_norm.
        self.batch_norm = batch_norm(
            ch_out,
            norm_type=norm_type,
            norm_decay=norm_decay,
            name=name,
            data_format=data_format)
        self.act = act

    def forward(self, inputs):
        """Run conv -> norm -> (optional) leaky ReLU on ``inputs``."""
        out = self.conv(inputs)
        out = self.batch_norm(out)
        if self.act == 'leaky':
            out = F.leaky_relu(out, 0.1)
        return out


class DownSample(nn.Layer):
    """Single ``ConvBNLayer`` whose defaults are a 3x3 kernel, stride 2 and
    padding 1.

    Args:
        ch_in: Input channel count forwarded to ``ConvBNLayer``.
        ch_out: Output channel count forwarded to ``ConvBNLayer``; also kept
            on the instance as ``self.ch_out``.
        filter_size: Forwarded to ``ConvBNLayer``.
        stride: Forwarded to ``ConvBNLayer``.
        padding: Forwarded to ``ConvBNLayer``.
        norm_type: Forwarded to ``ConvBNLayer``.
        norm_decay: Forwarded to ``ConvBNLayer``.
        name: Parameter-name prefix forwarded to ``ConvBNLayer``, which
            concatenates it with a suffix, so a string is required.
        data_format: Forwarded to ``ConvBNLayer``.
    """

    def __init__(self,
                 ch_in,
                 ch_out,
                 filter_size=3,
                 stride=2,
                 padding=1,
                 norm_type='bn',
                 norm_decay=0.,
                 name=None,
                 data_format='NCHW'):

        super(DownSample, self).__init__()

        self.conv_bn_layer = ConvBNLayer(
            ch_in=ch_in,
            ch_out=ch_out,
            filter_size=filter_size,
            stride=stride,
            padding=padding,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name=name)
        self.ch_out = ch_out

    def forward(self, inputs):
        """Apply the wrapped ``ConvBNLayer`` to ``inputs``."""
        out = self.conv_bn_layer(inputs)
        return out


class BasicBlock(nn.Layer):
    """Residual unit: 1x1 ``ConvBNLayer``, 3x3 ``ConvBNLayer``, then an
    element-wise add with the block input.

    The second convolution emits ``ch_out * 2`` channels and its result is
    added to ``inputs``, so callers are expected to pass an input that is
    add-compatible with that (``Blocks``/``DarkNet`` in this file use
    ``ch_in == ch_out * 2``).

    Args:
        ch_in: Input channel count of the 1x1 convolution.
        ch_out: Output channel count of the 1x1 convolution; the 3x3
            convolution maps ``ch_out`` to ``ch_out * 2``.
        norm_type: Forwarded to both ``ConvBNLayer`` instances.
        norm_decay: Forwarded to both ``ConvBNLayer`` instances.
        name: Parameter-name prefix. The two convolutions are named
            ``name + '.0'`` and ``name + '.1'``, so a string is required.
        data_format: Forwarded to both ``ConvBNLayer`` instances.
    """

    def __init__(self,
                 ch_in,
                 ch_out,
                 norm_type='bn',
                 norm_decay=0.,
                 name=None,
                 data_format='NCHW'):
        super(BasicBlock, self).__init__()

        self.conv1 = ConvBNLayer(
            ch_in=ch_in,
            ch_out=ch_out,
            filter_size=1,
            stride=1,
            padding=0,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name=name + '.0')
        self.conv2 = ConvBNLayer(
            ch_in=ch_out,
            ch_out=ch_out * 2,
            filter_size=3,
            stride=1,
            padding=1,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name=name + '.1')

    def forward(self, inputs):
        """Return ``inputs + conv2(conv1(inputs))``."""
        conv1 = self.conv1(inputs)
        conv2 = self.conv2(conv1)
        # Shortcut connection: add the untouched input to the conv output.
        out = paddle.add(x=inputs, y=conv2)
        return out


class Blocks(nn.Layer):
    """A chain of ``BasicBlock`` layers applied one after another.

    The first block maps ``ch_in`` input channels; each of the remaining
    ``count - 1`` blocks is built with ``ch_out * 2`` input channels.

    Args:
        ch_in: Input channel count of the first ``BasicBlock``.
        ch_out: ``ch_out`` argument for every ``BasicBlock``; also kept on
            the instance as ``self.ch_out``.
        count: Total number of ``BasicBlock`` layers (the first one plus
            ``count - 1`` additional ones).
        norm_type: Forwarded to every ``BasicBlock``.
        norm_decay: Forwarded to every ``BasicBlock``.
        name: Parameter-name prefix. The first block is named
            ``name + '.0'`` and the following ones ``'{name}.{i}'``, so a
            string is required.
        data_format: Forwarded to every ``BasicBlock``.
    """

    def __init__(self,
                 ch_in,
                 ch_out,
                 count,
                 norm_type='bn',
                 norm_decay=0.,
                 name=None,
                 data_format='NCHW'):
        super(Blocks, self).__init__()

        self.basicblock0 = BasicBlock(
            ch_in,
            ch_out,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name=name + '.0')
        # Plain list used only to iterate in forward(); each block is
        # registered on the layer through add_sublayer below.
        self.res_out_list = []
        for i in range(1, count):
            block_name = '{}.{}'.format(name, i)
            res_out = self.add_sublayer(
                block_name,
                BasicBlock(
                    ch_out * 2,
                    ch_out,
                    norm_type=norm_type,
                    norm_decay=norm_decay,
                    data_format=data_format,
                    name=block_name))
            self.res_out_list.append(res_out)
        self.ch_out = ch_out

    def forward(self, inputs):
        """Feed ``inputs`` through the first block and then every extra block."""
        y = self.basicblock0(inputs)
        for basic_block_i in self.res_out_list:
            y = basic_block_i(y)
        return y


# Maps a supported network depth to the number of BasicBlocks in each stage.
DarkNet_cfg = {
    53: [1, 2, 8, 8, 4],
}


@register
@serializable
class DarkNet(nn.Layer):
    """DarkNet backbone assembled from ``ConvBNLayer``, ``DownSample`` and
    ``Blocks``.

    Layout: a stem convolution (3 -> 32 channels) and a stem down-sample
    (32 -> 64), followed by ``num_stages`` ``Blocks`` stages with a
    ``DownSample`` between consecutive stages. Stage ``i`` outputs
    ``64 * 2**i`` channels.

    Args:
        depth: Key into ``DarkNet_cfg`` selecting the per-stage block counts;
            an unknown depth raises ``KeyError``.
        freeze_at: Index of the stage whose output gets
            ``stop_gradient = True``; the default ``-1`` matches no stage.
        return_idx: Indices of the stages whose outputs are returned by
            ``forward``.
        num_stages: Number of leading entries of the depth configuration to
            build.
        norm_type: Forwarded to every sub-layer.
        norm_decay: Forwarded to every sub-layer.
        data_format: Forwarded to every sub-layer.
    """

    __shared__ = ['norm_type', 'data_format']

    # NOTE(review): `return_idx` uses a mutable list default. It is only read
    # (never mutated) in this class; the default is left unchanged because the
    # `register` decorator may inspect signature defaults -- confirm before
    # switching it to None or a tuple.
    def __init__(self,
                 depth=53,
                 freeze_at=-1,
                 return_idx=[2, 3, 4],
                 num_stages=5,
                 norm_type='bn',
                 norm_decay=0.,
                 data_format='NCHW'):
        super(DarkNet, self).__init__()
        self.depth = depth
        self.freeze_at = freeze_at
        self.return_idx = return_idx
        self.num_stages = num_stages
        self.stages = DarkNet_cfg[self.depth][0:num_stages]

        # Stem: 3x3 convolution on the 3-channel input.
        self.conv0 = ConvBNLayer(
            ch_in=3,
            ch_out=32,
            filter_size=3,
            stride=1,
            padding=1,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name='yolo_input')

        # Stem down-sample: 32 -> 64 channels with DownSample's default stride.
        self.downsample0 = DownSample(
            ch_in=32,
            ch_out=32 * 2,
            norm_type=norm_type,
            norm_decay=norm_decay,
            data_format=data_format,
            name='yolo_input.downsample')

        self._out_channels = []
        self.darknet_conv_block_list = []
        self.downsample_list = []
        ch_in = [64, 128, 256, 512, 1024]
        # All stages are registered first, then all inter-stage down-samples;
        # this registration order is kept as in the original implementation.
        for i, stage in enumerate(self.stages):
            name = 'stage.{}'.format(i)
            conv_block = self.add_sublayer(
                name,
                Blocks(
                    int(ch_in[i]),
                    32 * (2**i),
                    stage,
                    norm_type=norm_type,
                    norm_decay=norm_decay,
                    data_format=data_format,
                    name=name))
            self.darknet_conv_block_list.append(conv_block)
            if i in return_idx:
                # Channel count of this stage's output, reported by out_shape.
                self._out_channels.append(64 * (2**i))
        for i in range(num_stages - 1):
            down_name = 'stage.{}.downsample'.format(i)
            downsample = self.add_sublayer(
                down_name,
                DownSample(
                    ch_in=32 * (2**(i + 1)),
                    ch_out=32 * (2**(i + 2)),
                    norm_type=norm_type,
                    norm_decay=norm_decay,
                    data_format=data_format,
                    name=down_name))
            self.downsample_list.append(downsample)

    def forward(self, inputs):
        """Run the backbone on ``inputs['image']``.

        Returns:
            A list with the outputs of the stages listed in
            ``self.return_idx``, in stage order.
        """
        x = inputs['image']

        out = self.conv0(x)
        out = self.downsample0(out)
        blocks = []
        for i, conv_block_i in enumerate(self.darknet_conv_block_list):
            out = conv_block_i(out)
            if i == self.freeze_at:
                # Cut the gradient flow at the output of the frozen stage.
                out.stop_gradient = True
            if i in self.return_idx:
                blocks.append(out)
            # Every stage but the last is followed by its down-sample layer.
            if i < self.num_stages - 1:
                out = self.downsample_list[i](out)
        return blocks

    @property
    def out_shape(self):
        """One ``ShapeSpec`` per returned stage, carrying its channel count."""
        return [ShapeSpec(channels=c) for c in self._out_channels]