# Source file: xdecoder-tiny_open-vocab-semseg.py (listed as 980 B)

  1. _base_ = 'mmdet::_base_/default_runtime.py'
  2. custom_imports = dict(
  3. imports=['projects.XDecoder.xdecoder'], allow_failed_imports=False)
  4. model = dict(
  5. type='XDecoder',
  6. data_preprocessor=dict(
  7. type='DetDataPreprocessor',
  8. mean=[123.675, 116.28, 103.53],
  9. std=[58.395, 57.12, 57.375],
  10. bgr_to_rgb=True,
  11. pad_size_divisor=32),
  12. backbone=dict(type='FocalNet'),
  13. head=dict(
  14. type='XDecoderUnifiedhead',
  15. in_channels=(96, 192, 384, 768),
  16. pixel_decoder=dict(type='XTransformerEncoderPixelDecoder'),
  17. transformer_decoder=dict(type='XDecoderTransformerDecoder'),
  18. task='semseg',
  19. ),
  20. # use_thr_for_mc=True means use threshold for multi-class
  21. # This parameter is only used in semantic segmentation task and
  22. # referring semantic segmentation task.
  23. test_cfg=dict(mask_thr=0.5, use_thr_for_mc=True, ignore_index=255),
  24. )
  25. val_cfg = dict(type='ValLoop')
  26. test_cfg = dict(type='TestLoop')