# xdecoder-tiny_zeroshot_text-image-retrieval.py
#
# Config override that reuses the caption config named in `_base_` and
# switches the model head to the 'retrieval' task, with its own test-time
# data pipeline.
#
# NOTE(review): `_base_.backend_args` below only resolves when this file is
# loaded by a config system that substitutes `_base_` with the parsed base
# config (presumably MMEngine's `Config.fromfile` - confirm). Imported as a
# plain Python module, `_base_` is just a str and the attribute access fails.

_base_ = 'xdecoder-tiny_zeroshot_caption_coco2014.py'

# Only the head's task is overridden here; every other model setting is left
# to the base config.
model = dict(head=dict(task='retrieval'))

# Not referenced anywhere else in this file.
# NOTE(review): presumably read by the base config or downstream code -
# confirm before removing.
grounding_scale = 512

# Evaluation-time transforms, listed in the order they are declared.
test_pipeline = [
    # Image loading, decoded with the pillow backend; storage backend
    # arguments are taken from the base config.
    dict(
        type='LoadImageFromFile',
        imdecode_backend='pillow',
        backend_args=_base_.backend_args),
    # Resize step configured with scale=224, pillow backend and bicubic
    # interpolation.
    dict(
        type='ResizeShortestEdge',
        scale=224,
        backend='pillow',
        interpolation='bicubic'),
    # Packing step; `meta_keys` names the metadata fields to carry along,
    # including 'text'.
    dict(
        type='PackDetInputs',
        meta_keys=('img_id', 'img_path', 'ori_shape', 'img_shape',
                   'scale_factor', 'text'))
]

# Override only the dataset pipeline of the validation dataloader.
val_dataloader = dict(dataset=dict(pipeline=test_pipeline))
# The test dataloader is the very same object as the validation dataloader.
test_dataloader = val_dataloader