download_and_convert_voc2012.py 2.5 KB
Newer Older
W
wuyefeilin 已提交
1 2
# coding: utf8
# Copyright (c) 2019 PaddlePaddle Authors. All Rights Reserved.
3
#
W
wuyefeilin 已提交
4
# Licensed under the Apache License, Version 2.0 (the "License");
5 6 7
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
W
wuyefeilin 已提交
8
#    http://www.apache.org/licenses/LICENSE-2.0
9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import sys
import os
import numpy as np
import os
import glob

LOCAL_PATH = os.path.dirname(os.path.abspath(__file__))
TEST_PATH = os.path.join(LOCAL_PATH, "..", "test")
sys.path.append(TEST_PATH)

from test_utils import download_file_and_uncompress
from convert_voc2012 import convert_list
from convert_voc2012 import remove_colormap
from convert_voc2012 import save_annotation


L
LutaoChu 已提交
32
def download_VOC_dataset(savepath, extrapath):
    """Download the VOC 2012 trainval archive and uncompress it.

    Both arguments are forwarded unchanged to
    ``download_file_and_uncompress`` together with the fixed archive URL.

    Args:
        savepath: Forwarded as ``savepath`` (presumably the directory where
            the downloaded archive is kept -- confirm against test_utils).
        extrapath: Forwarded as ``extrapath`` (presumably the directory the
            archive is extracted into -- confirm against test_utils).
    """
    voc_archive_url = (
        "https://paddleseg.bj.bcebos.com/dataset/VOCtrainval_11-May-2012.tar")
    download_file_and_uncompress(
        url=voc_archive_url, savepath=savepath, extrapath=extrapath)

W
wuyefeilin 已提交
37

38
def txt_to_list_path(txt_path):
    """Return ``txt_path`` with its file extension swapped for ``.list``.

    Only the trailing extension is rewritten. A plain
    ``str.replace('txt', 'list')`` would also rewrite any "txt" that happens
    to occur in a parent directory name, producing a path that points into a
    directory that does not exist.

    Args:
        txt_path: Path to an image-set file such as ``train.txt``.

    Returns:
        The same path with the extension replaced by ``.list``.
    """
    stem, _ = os.path.splitext(txt_path)
    return stem + ".list"


if __name__ == "__main__":
    # Fetch the archive and unpack it next to this script.
    download_VOC_dataset(LOCAL_PATH, LOCAL_PATH)
    print("Dataset download finish!")

    pascal_root = "./VOCtrainval_11-May-2012/VOC2012"
    pascal_root = os.path.join(LOCAL_PATH, pascal_root)
    seg_folder = os.path.join(pascal_root, "SegmentationClass")
    txt_folder = os.path.join(pascal_root, "ImageSets/Segmentation")
    train_path = os.path.join(txt_folder, "train.txt")
    val_path = os.path.join(txt_folder, "val.txt")
    trainval_path = os.path.join(txt_folder, "trainval.txt")

    # Directory where the converted annotation images are stored.
    output_folder = os.path.join(pascal_root, "SegmentationClassAug")

    print("annotation convert and file list convert")
    if not os.path.exists(output_folder):
        os.mkdir(output_folder)

    # Pass every annotation PNG through remove_colormap and save the result
    # under the same file name inside output_folder.
    for annotation_name in glob.glob(os.path.join(seg_folder, '*.png')):
        annotation = remove_colormap(annotation_name)
        filename = os.path.basename(annotation_name)
        save_annotation(annotation, os.path.join(output_folder, filename))

    # Call convert_list for each split file, giving it a sibling ".list"
    # path as the second argument.
    for txt_path in (train_path, val_path, trainval_path):
        convert_list(txt_path, txt_to_list_path(txt_path), output_folder)