labelme2voc.py 3.3 KB
Newer Older
1 2 3 4 5 6 7 8
#!/usr/bin/env python

from __future__ import print_function

import argparse
import glob
import os
import os.path as osp
K
Kentaro Wada 已提交
9
import sys
10

11
import imgviz
12 13 14 15 16 17 18
import numpy as np

import labelme


def main():
    parser = argparse.ArgumentParser(
19 20 21 22
        formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )
    parser.add_argument('input_dir', help='input annotated directory')
    parser.add_argument('output_dir', help='output dataset directory')
K
Kentaro Wada 已提交
23
    parser.add_argument('--labels', help='labels file', required=True)
24 25 26
    parser.add_argument(
        '--noviz', help='no visualization', action='store_true'
    )
27 28
    args = parser.parse_args()

29 30 31 32 33 34 35
    if osp.exists(args.output_dir):
        print('Output directory already exists:', args.output_dir)
        sys.exit(1)
    os.makedirs(args.output_dir)
    os.makedirs(osp.join(args.output_dir, 'JPEGImages'))
    os.makedirs(osp.join(args.output_dir, 'SegmentationClass'))
    os.makedirs(osp.join(args.output_dir, 'SegmentationClassPNG'))
36 37 38 39
    if not args.noviz:
        os.makedirs(
            osp.join(args.output_dir, 'SegmentationClassVisualization')
        )
40
    print('Creating dataset:', args.output_dir)
41 42 43

    class_names = []
    class_name_to_id = {}
44
    for i, line in enumerate(open(args.labels).readlines()):
45 46 47 48 49 50 51 52 53 54 55
        class_id = i - 1  # starts with -1
        class_name = line.strip()
        class_name_to_id[class_name] = class_id
        if class_id == -1:
            assert class_name == '__ignore__'
            continue
        elif class_id == 0:
            assert class_name == '_background_'
        class_names.append(class_name)
    class_names = tuple(class_names)
    print('class_names:', class_names)
56
    out_class_names_file = osp.join(args.output_dir, 'class_names.txt')
57 58 59 60
    with open(out_class_names_file, 'w') as f:
        f.writelines('\n'.join(class_names))
    print('Saved class_names:', out_class_names_file)

61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77
    for filename in glob.glob(osp.join(args.input_dir, '*.json')):
        print('Generating dataset from:', filename)

        label_file = labelme.LabelFile(filename=filename)

        base = osp.splitext(osp.basename(filename))[0]
        out_img_file = osp.join(
            args.output_dir, 'JPEGImages', base + '.jpg')
        out_lbl_file = osp.join(
            args.output_dir, 'SegmentationClass', base + '.npy')
        out_png_file = osp.join(
            args.output_dir, 'SegmentationClassPNG', base + '.png')
        if not args.noviz:
            out_viz_file = osp.join(
                args.output_dir,
                'SegmentationClassVisualization',
                base + '.jpg',
78
            )
79 80 81 82 83

        with open(out_img_file, 'wb') as f:
            f.write(label_file.imageData)
        img = labelme.utils.img_data_to_arr(label_file.imageData)

84
        lbl, _ = labelme.utils.shapes_to_label(
85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101
            img_shape=img.shape,
            shapes=label_file.shapes,
            label_name_to_value=class_name_to_id,
        )
        labelme.utils.lblsave(out_png_file, lbl)

        np.save(out_lbl_file, lbl)

        if not args.noviz:
            viz = imgviz.label2rgb(
                label=lbl,
                img=imgviz.rgb2gray(img),
                font_size=15,
                label_names=class_names,
                loc='rb',
            )
            imgviz.io.imsave(out_viz_file, viz)
102 103 104 105


if __name__ == '__main__':
    main()