7 년 전 · f4dfc47a55
--- a/README.md
+++ b/README.md
@@ -31,6 +31,7 @@ It is written in Python and uses Qt for its graphical interface.
 
				 - [x] Video annotation. ([video annotation](examples/video_annotation))
			
 
				 - [x] GUI customization (predefined labels / flags, auto-saving, label validation, etc). ([#144](https://github.com/wkentaro/labelme/pull/144))
			
 
				 - [x] Exporting VOC-like dataset for semantic/instance segmentation. ([semantic segmentation](examples/semantic_segmentation), [instance segmentation](examples/instance_segmentation))
			
 
				+- [x] Exporting COCO-like dataset for instance segmentation. ([instance segmentation](examples/instance_segmentation))
			
 
				 
			
 
				 
			
 
				 
			
--- a/examples/instance_segmentation/README.md
+++ b/examples/instance_segmentation/README.md
@@ -34,3 +34,13 @@ labelme_draw_label_png data_dataset_voc/SegmentationObjectPNG/2011_000003.png  #
 
				 ```
			
 
				 
			
 
				 <img src=".readme/draw_label_png_class.jpg" width="33%" /> <img src=".readme/draw_label_png_object.jpg" width="33%" />
			
 
				+
			
 
				+
			
 
				+## Convert to COCO-like Dataset
			
 
				+
			
 
				+```bash
			
 
				+# It generates:
			
 
				+#   - data_dataset_coco/JPEGImages
			
 
				+#   - data_dataset_coco/annotations.json
			
 
				+./labelme2coco.py data_annotated data_dataset_coco --labels labels.txt
			
 
				+```
			
--- a/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000003.jpg
+++ b/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000003.jpg
--- a/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000006.jpg
+++ b/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000006.jpg
--- a/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000025.jpg
+++ b/examples/instance_segmentation/data_dataset_coco/JPEGImages/2011_000025.jpg
--- a/examples/instance_segmentation/data_dataset_coco/annotations.json
+++ b/examples/instance_segmentation/data_dataset_coco/annotations.json
--- a/examples/instance_segmentation/labelme2coco.py
+++ b/examples/instance_segmentation/labelme2coco.py
@@ -0,0 +1,146 @@
 
				+#!/usr/bin/env python
			
 
				+
			
 
				+import argparse
			
 
				+import datetime
			
 
				+import glob
			
 
				+import json
			
 
				+import os
			
 
				+import os.path as osp
			
 
				+import sys
			
 
				+
			
 
				+import numpy as np
			
 
				+import PIL.Image
			
 
				+
			
 
				+import labelme
			
 
				+
			
 
				+try:
			
 
				+    import pycocotools.mask
			
 
				+except ImportError:
			
 
				+    print('Please install pycocotools:\n\n    pip install pycocotools\n')
			
 
				+    sys.exit(1)
			
 
				+
			
 
				+
			
 
				+def main():
			
 
				+    parser = argparse.ArgumentParser(
			
 
				+        formatter_class=argparse.ArgumentDefaultsHelpFormatter
			
 
				+    )
			
 
				+    parser.add_argument('input_dir', help='input annotated directory')
			
 
				+    parser.add_argument('output_dir', help='output dataset directory')
			
 
				+    parser.add_argument('--labels', help='labels file')
			
 
				+    args = parser.parse_args()
			
 
				+
			
 
				+    if osp.exists(args.output_dir):
			
 
				+        print('Output directory already exists:', args.output_dir)
			
 
				+        sys.exit(1)
			
 
				+    os.makedirs(args.output_dir)
			
 
				+    os.makedirs(osp.join(args.output_dir, 'JPEGImages'))
			
 
				+    print('Creating dataset:', args.output_dir)
			
 
				+
			
 
				+    now = datetime.datetime.now()
			
 
				+
			
 
				+    data = dict(
			
 
				+        info=dict(
			
 
				+            description=None,
			
 
				+            url=None,
			
 
				+            version=None,
			
 
				+            year=now.year,
			
 
				+            contributor=None,
			
 
				+            date_created=now.strftime('%Y-%m-%d %H:%M:%S.%f'),
			
 
				+        ),
			
 
				+        licenses=[dict(
			
 
				+            url=None,
			
 
				+            id=0,
			
 
				+            name=None,
			
 
				+        )],
			
 
				+        images=[
			
 
				+            # license, url, file_name, height, width, date_captured, id
			
 
				+        ],
			
 
				+        type='instances',
			
 
				+        annotations=[
			
 
				+            # segmentation, area, iscrowd, image_id, bbox, category_id, id
			
 
				+        ],
			
 
				+        categories=[
			
 
				+            # supercategory, id, name
			
 
				+        ],
			
 
				+    )
			
 
				+
			
 
				+    class_name_to_id = {}
			
 
				+    for i, line in enumerate(open(args.labels).readlines()):
			
 
				+        class_id = i - 1  # starts with -1
			
 
				+        class_name = line.strip()
			
 
				+        if class_id == -1:
			
 
				+            assert class_name == '__ignore__'
			
 
				+            continue
			
 
				+        elif class_id == 0:
			
 
				+            assert class_name == '_background_'
			
 
				+        class_name_to_id[class_name] = class_id
			
 
				+        data['categories'].append(dict(
			
 
				+            supercategory=None,
			
 
				+            id=class_id,
			
 
				+            name=class_name,
			
 
				+        ))
			
 
				+
			
 
				+    out_ann_file = osp.join(args.output_dir, 'annotations.json')
			
 
				+    label_files = glob.glob(osp.join(args.input_dir, '*.json'))
			
 
				+    for image_id, label_file in enumerate(label_files):
			
 
				+        print('Generating dataset from:', label_file)
			
 
				+        with open(label_file) as f:
			
 
				+            label_data = json.load(f)
			
 
				+
			
 
				+        base = osp.splitext(osp.basename(label_file))[0]
			
 
				+        out_img_file = osp.join(
			
 
				+            args.output_dir, 'JPEGImages', base + '.jpg'
			
 
				+        )
			
 
				+
			
 
				+        img_file = osp.join(
			
 
				+            osp.dirname(label_file), label_data['imagePath']
			
 
				+        )
			
 
				+        img = np.asarray(PIL.Image.open(img_file))
			
 
				+        PIL.Image.fromarray(img).save(out_img_file)
			
 
				+        data['images'].append(dict(
			
 
				+            license=0,
			
 
				+            url=None,
			
 
				+            file_name=osp.relpath(out_img_file, osp.dirname(out_ann_file)),
			
 
				+            height=img.shape[0],
			
 
				+            width=img.shape[1],
			
 
				+            date_captured=None,
			
 
				+            id=image_id,
			
 
				+        ))
			
 
				+
			
 
				+        masks = {}
			
 
				+        for shape in label_data['shapes']:
			
 
				+            points = shape['points']
			
 
				+            label = shape['label']
			
 
				+            shape_type = shape.get('shape_type', None)
			
 
				+            mask = labelme.utils.shape_to_mask(
			
 
				+                img.shape[:2], points, shape_type
			
 
				+            )
			
 
				+
			
 
				+            mask = np.asfortranarray(mask.astype(np.uint8))
			
 
				+            if label in masks:
			
 
				+                masks[label] = masks[label] | mask
			
 
				+            else:
			
 
				+                masks[label] = mask
			
 
				+
			
 
				+        for label, mask in masks.items():
			
 
				+            cls_name = label.split('-')[0]
			
 
				+            if cls_name not in class_name_to_id:
			
 
				+                continue
			
 
				+            cls_id = class_name_to_id[cls_name]
			
 
				+            segmentation = pycocotools.mask.encode(mask)
			
 
				+            segmentation['counts'] = segmentation['counts'].decode()
			
 
				+            area = float(pycocotools.mask.area(segmentation))
			
 
				+            data['annotations'].append(dict(
			
 
				+                segmentation=segmentation,
			
 
				+                area=area,
			
 
				+                iscrowd=None,
			
 
				+                image_id=image_id,
			
 
				+                category_id=cls_id,
			
 
				+            ))
			
 
				+
			
 
				+    with open(out_ann_file, 'w') as f:
			
 
				+        json.dump(data, f)
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    main()