json_to_dataset.py 1.7 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758
  1. import argparse
  2. import json
  3. import os
  4. import os.path as osp
  5. import warnings
  6. import PIL.Image
  7. import yaml
  8. from labelme import utils
  9. def main():
  10. warnings.warn("This script is aimed to demonstrate how to convert the\n"
  11. "JSON file to a single image dataset, and not to handle\n"
  12. "multiple JSON files to generate a real-use dataset.")
  13. parser = argparse.ArgumentParser()
  14. parser.add_argument('json_file')
  15. parser.add_argument('-o', '--out', default=None)
  16. args = parser.parse_args()
  17. json_file = args.json_file
  18. if args.out is None:
  19. out_dir = osp.basename(json_file).replace('.', '_')
  20. out_dir = osp.join(osp.dirname(json_file), out_dir)
  21. else:
  22. out_dir = args.out
  23. if not osp.exists(out_dir):
  24. os.mkdir(out_dir)
  25. data = json.load(open(json_file))
  26. img = utils.img_b64_to_array(data['imageData'])
  27. lbl, lbl_names = utils.labelme_shapes_to_label(img.shape, data['shapes'])
  28. captions = ['%d: %s' % (l, name) for l, name in enumerate(lbl_names)]
  29. lbl_viz = utils.draw_label(lbl, img, captions)
  30. PIL.Image.fromarray(img).save(osp.join(out_dir, 'img.png'))
  31. PIL.Image.fromarray(lbl).save(osp.join(out_dir, 'label.png'))
  32. PIL.Image.fromarray(lbl_viz).save(osp.join(out_dir, 'label_viz.png'))
  33. with open(osp.join(out_dir, 'label_names.txt'), 'w') as f:
  34. for lbl_name in lbl_names:
  35. f.write(lbl_name + '\n')
  36. warnings.warn('info.yaml is being replaced by label_names.txt')
  37. info = dict(label_names=lbl_names)
  38. with open(osp.join(out_dir, 'info.yaml'), 'w') as f:
  39. yaml.safe_dump(info, f, default_flow_style=False)
  40. print('Saved to: %s' % out_dir)
# Run the conversion only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()