123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156 |
- #!/usr/bin/env python
- from __future__ import print_function
- import argparse
- import glob
- import os
- import os.path as osp
- import sys
- import imgviz
- import numpy as np
- import labelme
def _load_labels(labels_arg):
    """Return the label names described by the ``--labels`` argument.

    ``labels_arg`` is read as a file with one label per line when it names an
    existing path; otherwise it is split as comma separated text. Surrounding
    whitespace is stripped and empty entries (blank lines, stray commas) are
    dropped so they cannot become empty class names or shift class ids.
    """
    if osp.exists(labels_arg):
        with open(labels_arg) as f:
            candidates = [line.strip() for line in f]
    else:
        candidates = [item.strip() for item in labels_arg.split(",")]
    return [label for label in candidates if label]


def _build_class_mapping(labels):
    """Assign class ids to ``labels`` and return ``(class_names, name_to_id)``.

    Ids are assigned in order starting at -1. The label with id -1 must be
    ``__ignore__`` and the label with id 0 must be ``_background_``.
    ``class_names`` is a tuple of the labels with id >= 0; ``name_to_id`` maps
    every label (including ``__ignore__``) to its id.

    Raises:
        ValueError: if ``labels`` is empty or the first two labels are not the
            required reserved names.
    """
    if not labels:
        raise ValueError("no labels given")
    reserved = {-1: "__ignore__", 0: "_background_"}
    class_names = []
    class_name_to_id = {}
    for class_id, class_name in enumerate(labels, -1):  # starts with -1
        if class_id in reserved and class_name != reserved[class_id]:
            raise ValueError(
                "label #{} must be {!r}, got {!r}".format(
                    class_id + 2, reserved[class_id], class_name
                )
            )
        class_name_to_id[class_name] = class_id
        if class_id >= 0:
            class_names.append(class_name)
    return tuple(class_names), class_name_to_id


def _make_output_dirs(output_dir, label_kinds, save_npy, save_viz):
    """Create ``output_dir`` with JPEGImages and the per-kind subdirectories."""
    os.makedirs(output_dir)
    os.makedirs(osp.join(output_dir, "JPEGImages"))
    for kind in label_kinds:
        os.makedirs(osp.join(output_dir, kind))
        if save_npy:
            os.makedirs(osp.join(output_dir, kind + "Npy"))
        if save_viz:
            os.makedirs(osp.join(output_dir, kind + "Visualization"))


def _save_label_outputs(
    output_dir, kind, base, lbl, img, label_names, save_npy, save_viz
):
    """Write one label array as PNG, plus optional .npy and visualization."""
    labelme.utils.lblsave(osp.join(output_dir, kind, base + ".png"), lbl)
    if save_npy:
        np.save(osp.join(output_dir, kind + "Npy", base + ".npy"), lbl)
    if save_viz:
        viz = imgviz.label2rgb(
            lbl,
            imgviz.rgb2gray(img),
            label_names=label_names,
            font_size=15,
            loc="rb",
        )
        imgviz.io.imsave(
            osp.join(output_dir, kind + "Visualization", base + ".jpg"), viz
        )


def main():
    """Convert a directory of labelme JSON annotations into a VOC-style dataset.

    Command line: ``input_dir output_dir --labels LABELS`` with the optional
    flags ``--noobject``, ``--nonpy`` and ``--noviz``. For every ``*.json``
    file in ``input_dir`` the image is written to ``JPEGImages`` and the class
    (and, unless ``--noobject``, instance) labels are written as PNG, with
    optional ``.npy`` and visualization copies. ``class_names.txt`` lists the
    class names with id >= 0.

    Exits with status 1 when ``output_dir`` already exists or the labels are
    invalid. Labels are validated before anything is created, so a bad
    ``--labels`` value does not leave a partial output directory behind that
    would block the next run.
    """
    parser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter
    )
    parser.add_argument("input_dir", help="Input annotated directory")
    parser.add_argument("output_dir", help="Output dataset directory")
    parser.add_argument(
        "--labels", help="Labels file or comma separated text", required=True
    )
    parser.add_argument(
        "--noobject", help="Flag not to generate object label", action="store_true"
    )
    parser.add_argument(
        "--nonpy", help="Flag not to generate .npy files", action="store_true"
    )
    parser.add_argument(
        "--noviz", help="Flag to disable visualization", action="store_true"
    )
    args = parser.parse_args()

    if osp.exists(args.output_dir):
        print("Output directory already exists:", args.output_dir)
        sys.exit(1)

    # Explicit validation instead of ``assert``: asserts vanish under ``-O``.
    try:
        class_names, class_name_to_id = _build_class_mapping(
            _load_labels(args.labels)
        )
    except ValueError as err:
        print("Invalid labels:", err)
        sys.exit(1)

    save_npy = not args.nonpy
    save_viz = not args.noviz
    label_kinds = ["SegmentationClass"]
    if not args.noobject:
        label_kinds.append("SegmentationObject")
    _make_output_dirs(args.output_dir, label_kinds, save_npy, save_viz)
    print("Creating dataset:", args.output_dir)

    print("class_names:", class_names)
    out_class_names_file = osp.join(args.output_dir, "class_names.txt")
    with open(out_class_names_file, "w") as f:
        f.write("\n".join(class_names))
    print("Saved class_names:", out_class_names_file)

    for filename in sorted(glob.glob(osp.join(args.input_dir, "*.json"))):
        print("Generating dataset from:", filename)

        label_file = labelme.LabelFile(filename=filename)
        base = osp.splitext(osp.basename(filename))[0]

        img = labelme.utils.img_data_to_arr(label_file.imageData)
        imgviz.io.imsave(
            osp.join(args.output_dir, "JPEGImages", base + ".jpg"), img
        )

        cls, ins = labelme.utils.shapes_to_label(
            img_shape=img.shape,
            shapes=label_file.shapes,
            label_name_to_value=class_name_to_id,
        )
        ins[cls == -1] = 0  # ignore it.

        # class label
        _save_label_outputs(
            args.output_dir,
            "SegmentationClass",
            base,
            cls,
            img,
            class_names,
            save_npy,
            save_viz,
        )

        if not args.noobject:
            # instance label; names are simply "0" .. "<largest instance id>"
            instance_names = [str(i) for i in range(int(ins.max()) + 1)]
            _save_label_outputs(
                args.output_dir,
                "SegmentationObject",
                base,
                ins,
                img,
                instance_names,
                save_npy,
                save_viz,
            )


# Run the conversion only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
|