From 758c84a1e6b41e1281d5cbf88b80fc5d784683e6 Mon Sep 17 00:00:00 2001
From: jerrywgz
Date: Tue, 25 Jun 2019 09:37:45 +0800
Subject: [PATCH] add mask_rcnn_se154_fpn_s1x in object detection (#2514)

---
Reviewer notes (text in this section is not part of the commit):
 * Line breaks were restored from a whitespace-collapsed copy of this patch.
   The added content is unchanged and the hunk holds exactly 156 added lines,
   matching the hunk header and the diffstat below.
 * NOTE(review): nesting depth of the YAML keys was reconstructed from the key
   names because the collapsed copy carried no indentation; confirm against
   blob c71c39b2 before applying.
 * NOTE(review): the key `canconical_level` under FPNRoIAlign is kept exactly
   as submitted; presumably it matches the consumer's parameter spelling, so
   confirm before renaming it.

 .../configs/mask_rcnn_se154_fpn_s1x.yml       | 156 ++++++++++++++++++
 1 file changed, 156 insertions(+)
 create mode 100644 PaddleCV/object_detection/configs/mask_rcnn_se154_fpn_s1x.yml

diff --git a/PaddleCV/object_detection/configs/mask_rcnn_se154_fpn_s1x.yml b/PaddleCV/object_detection/configs/mask_rcnn_se154_fpn_s1x.yml
new file mode 100644
index 00000000..c71c39b2
--- /dev/null
+++ b/PaddleCV/object_detection/configs/mask_rcnn_se154_fpn_s1x.yml
@@ -0,0 +1,156 @@
+architecture: MaskRCNN
+train_feed: MaskRCNNTrainFeed
+eval_feed: MaskRCNNEvalFeed
+test_feed: MaskRCNNTestFeed
+max_iters: 260000
+snapshot_iter: 10000
+use_gpu: True
+log_smooth_window: 20
+save_dir: output
+pretrain_weights: https://paddle-imagenet-models-name.bj.bcebos.com/SE154_vd_pretrained.tar
+weights: output/mask_rcnn_se154_fpn_s1x/model_final/
+metric: COCO
+
+MaskRCNN:
+  backbone: SENet
+  fpn: FPN
+  rpn_head: FPNRPNHead
+  roi_extractor: FPNRoIAlign
+  bbox_head: BBoxHead
+  bbox_assigner: BBoxAssigner
+
+SENet:
+  depth: 152
+  feature_maps: [2, 3, 4, 5]
+  freeze_at: 2
+  group_width: 4
+  groups: 64
+  norm_type: affine_channel
+  variant: d
+
+FPN:
+  max_level: 6
+  min_level: 2
+  num_chan: 256
+  spatial_scale: [0.03125, 0.0625, 0.125, 0.25]
+
+FPNRPNHead:
+  anchor_generator:
+    aspect_ratios: [0.5, 1.0, 2.0]
+    variance: [1.0, 1.0, 1.0, 1.0]
+  anchor_start_size: 32
+  max_level: 6
+  min_level: 2
+  num_chan: 256
+  rpn_target_assign:
+    rpn_batch_size_per_im: 256
+    rpn_fg_fraction: 0.5
+    rpn_negative_overlap: 0.3
+    rpn_positive_overlap: 0.7
+    rpn_straddle_thresh: 0.0
+  train_proposal:
+    min_size: 0.0
+    nms_thresh: 0.7
+    post_nms_top_n: 2000
+    pre_nms_top_n: 2000
+  test_proposal:
+    min_size: 0.0
+    nms_thresh: 0.7
+    post_nms_top_n: 1000
+    pre_nms_top_n: 1000
+
+FPNRoIAlign:
+  canconical_level: 4
+  canonical_size: 224
+  max_level: 5
+  min_level: 2
+  box_resolution: 7
+  sampling_ratio: 2
+  mask_resolution: 14
+
+MaskHead:
+  dilation: 1
+  num_chan_reduced: 256
+  num_classes: 81
+  num_convs: 4
+  resolution: 28
+
+BBoxAssigner:
+  batch_size_per_im: 512
+  bbox_reg_weights: [0.1, 0.1, 0.2, 0.2]
+  bg_thresh_hi: 0.5
+  bg_thresh_lo: 0.0
+  fg_fraction: 0.25
+  fg_thresh: 0.5
+  num_classes: 81
+
+MaskAssigner:
+  resolution: 28
+
+BBoxHead:
+  head: TwoFCHead
+  nms:
+    keep_top_k: 100
+    nms_threshold: 0.5
+    score_threshold: 0.05
+  num_classes: 81
+
+TwoFCHead:
+  num_chan: 1024
+
+LearningRate:
+  base_lr: 0.01
+  schedulers:
+  - !PiecewiseDecay
+    gamma: 0.1
+    milestones: [200000, 240000]
+    values: null
+  - !LinearWarmup
+    start_factor: 0.3333333333333333
+    steps: 500
+
+OptimizerBuilder:
+  optimizer:
+    momentum: 0.9
+    type: Momentum
+  regularizer:
+    factor: 0.0001
+    type: L2
+
+MaskRCNNTrainFeed:
+  # batch size per device
+  batch_size: 1
+  batch_transforms:
+  - !PadBatch
+    pad_to_stride: 32
+  dataset:
+    dataset_dir: data/coco
+    image_dir: train2017
+    annotation: annotations/instances_train2017.json
+  num_workers: 2
+  shuffle: True
+  use_padded_im_info: False
+
+MaskRCNNEvalFeed:
+  batch_size: 1
+  batch_transforms:
+  - !PadBatch
+    pad_to_stride: 32
+  dataset:
+    dataset_dir: data/coco
+    annotation: annotations/instances_val2017.json
+    image_dir: val2017
+  num_workers: 2
+  use_padded_im_info: True
+
+MaskRCNNTestFeed:
+  batch_size: 1
+  batch_transforms:
+  - !PadBatch
+    pad_to_stride: 32
+  dataset:
+    dataset_dir: data/coco
+    annotation: annotations/instances_val2017.json
+    image_dir: val2017
+  num_workers: 2
+  use_padded_im_info: True
-- 
GitLab