# youtube_vis.py (2.0 KB)
  1. dataset_type = 'YouTubeVISDataset'
  2. data_root = 'data/youtube_vis_2019/'
  3. dataset_version = data_root[-5:-1] # 2019 or 2021
  4. backend_args = None
  5. # dataset settings
  6. train_pipeline = [
  7. dict(
  8. type='UniformRefFrameSample',
  9. num_ref_imgs=1,
  10. frame_range=100,
  11. filter_key_img=True),
  12. dict(
  13. type='TransformBroadcaster',
  14. share_random_params=True,
  15. transforms=[
  16. dict(type='LoadImageFromFile', backend_args=backend_args),
  17. dict(type='LoadTrackAnnotations', with_mask=True),
  18. dict(type='Resize', scale=(640, 360), keep_ratio=True),
  19. dict(type='RandomFlip', prob=0.5),
  20. ]),
  21. dict(type='PackTrackInputs')
  22. ]
  23. test_pipeline = [
  24. dict(
  25. type='TransformBroadcaster',
  26. transforms=[
  27. dict(type='LoadImageFromFile', backend_args=backend_args),
  28. dict(type='Resize', scale=(640, 360), keep_ratio=True),
  29. dict(type='LoadTrackAnnotations', with_mask=True),
  30. ]),
  31. dict(type='PackTrackInputs')
  32. ]
  33. # dataloader
  34. train_dataloader = dict(
  35. batch_size=2,
  36. num_workers=2,
  37. persistent_workers=True,
  38. # sampler=dict(type='TrackImgSampler'), # image-based sampling
  39. sampler=dict(type='DefaultSampler', shuffle=True),
  40. batch_sampler=dict(type='TrackAspectRatioBatchSampler'),
  41. dataset=dict(
  42. type=dataset_type,
  43. data_root=data_root,
  44. dataset_version=dataset_version,
  45. ann_file='annotations/youtube_vis_2019_train.json',
  46. data_prefix=dict(img_path='train/JPEGImages'),
  47. pipeline=train_pipeline))
  48. val_dataloader = dict(
  49. batch_size=1,
  50. num_workers=2,
  51. persistent_workers=True,
  52. drop_last=False,
  53. sampler=dict(type='DefaultSampler', shuffle=False, round_up=False),
  54. dataset=dict(
  55. type=dataset_type,
  56. data_root=data_root,
  57. dataset_version=dataset_version,
  58. ann_file='annotations/youtube_vis_2019_valid.json',
  59. data_prefix=dict(img_path='valid/JPEGImages'),
  60. test_mode=True,
  61. pipeline=test_pipeline))
  62. test_dataloader = val_dataloader