json_to_dataset.py 2.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576
  1. import argparse
  2. import json
  3. import os
  4. import os.path as osp
  5. import warnings
  6. import PIL.Image
  7. import yaml
  8. from labelme import utils
  9. def main():
  10. warnings.warn("This script is aimed to demonstrate how to convert the\n"
  11. "JSON file to a single image dataset, and not to handle\n"
  12. "multiple JSON files to generate a real-use dataset.")
  13. parser = argparse.ArgumentParser()
  14. parser.add_argument('json_file')
  15. parser.add_argument('-o', '--out', default=None)
  16. args = parser.parse_args()
  17. json_file = args.json_file
  18. if args.out is None:
  19. out_dir = osp.basename(json_file).replace('.', '_')
  20. out_dir = osp.join(osp.dirname(json_file), out_dir)
  21. else:
  22. out_dir = args.out
  23. if not osp.exists(out_dir):
  24. os.mkdir(out_dir)
  25. data = json.load(open(json_file))
  26. img = utils.img_b64_to_arr(data['imageData'])
  27. label_name_to_value = {'_background_': 0}
  28. for shape in data['shapes']:
  29. label_name = shape['label']
  30. if label_name in label_name_to_value:
  31. label_value = label_name_to_value[label_name]
  32. else:
  33. label_value = len(label_name_to_value)
  34. label_name_to_value[label_name] = label_value
  35. # label_values must be dense
  36. label_values, label_names = [], []
  37. for ln, lv in sorted(label_name_to_value.items(), key=lambda x: x[1]):
  38. label_values.append(lv)
  39. label_names.append(ln)
  40. assert label_values == list(range(len(label_values)))
  41. lbl = utils.shapes_to_label(img.shape, data['shapes'], label_name_to_value)
  42. captions = ['{}: {}'.format(lv, ln)
  43. for ln, lv in label_name_to_value.items()]
  44. lbl_viz = utils.draw_label(lbl, img, captions)
  45. PIL.Image.fromarray(img).save(osp.join(out_dir, 'img.png'))
  46. PIL.Image.fromarray(lbl).save(osp.join(out_dir, 'label.png'))
  47. PIL.Image.fromarray(lbl_viz).save(osp.join(out_dir, 'label_viz.png'))
  48. with open(osp.join(out_dir, 'label_names.txt'), 'w') as f:
  49. for lbl_name in label_names:
  50. f.write(lbl_name + '\n')
  51. warnings.warn('info.yaml is being replaced by label_names.txt')
  52. info = dict(label_names=label_names)
  53. with open(osp.join(out_dir, 'info.yaml'), 'w') as f:
  54. yaml.safe_dump(info, f, default_flow_style=False)
  55. print('Saved to: %s' % out_dir)
  56. if __name__ == '__main__':
  57. main()