# xdecoder-tiny_zeroshot_ref-caption.py (517 B as listed by the source viewer)

  1. _base_ = 'xdecoder-tiny_zeroshot_caption_coco2014.py'
  2. model = dict(head=dict(task='ref-caption'))
  3. grounding_scale = 512
  4. test_pipeline = [
  5. dict(type='LoadImageFromFile', imdecode_backend='pillow'),
  6. dict(type='ResizeShortestEdge', scale=224, backend='pillow'),
  7. dict(
  8. type='PackDetInputs',
  9. meta_keys=('img_id', 'img_path', 'ori_shape', 'img_shape',
  10. 'scale_factor', 'text'))
  11. ]
  12. val_dataloader = dict(dataset=dict(pipeline=test_pipeline))
  13. test_dataloader = val_dataloader