sparse-rcnn_r50_fpn_300-proposals_crop-ms-480-800-3x_coco.py 1.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243
  1. _base_ = './sparse-rcnn_r50_fpn_ms-480-800-3x_coco.py'
  2. num_proposals = 300
  3. model = dict(
  4. rpn_head=dict(num_proposals=num_proposals),
  5. test_cfg=dict(
  6. _delete_=True, rpn=None, rcnn=dict(max_per_img=num_proposals)))
  7. # augmentation strategy originates from DETR.
  8. train_pipeline = [
  9. dict(type='LoadImageFromFile', backend_args={{_base_.backend_args}}),
  10. dict(type='LoadAnnotations', with_bbox=True),
  11. dict(type='RandomFlip', prob=0.5),
  12. dict(
  13. type='RandomChoice',
  14. transforms=[[
  15. dict(
  16. type='RandomChoiceResize',
  17. scales=[(480, 1333), (512, 1333), (544, 1333), (576, 1333),
  18. (608, 1333), (640, 1333), (672, 1333), (704, 1333),
  19. (736, 1333), (768, 1333), (800, 1333)],
  20. keep_ratio=True)
  21. ],
  22. [
  23. dict(
  24. type='RandomChoiceResize',
  25. scales=[(400, 1333), (500, 1333), (600, 1333)],
  26. keep_ratio=True),
  27. dict(
  28. type='RandomCrop',
  29. crop_type='absolute_range',
  30. crop_size=(384, 600),
  31. allow_negative_crop=True),
  32. dict(
  33. type='RandomChoiceResize',
  34. scales=[(480, 1333), (512, 1333), (544, 1333),
  35. (576, 1333), (608, 1333), (640, 1333),
  36. (672, 1333), (704, 1333), (736, 1333),
  37. (768, 1333), (800, 1333)],
  38. keep_ratio=True)
  39. ]]),
  40. dict(type='PackDetInputs')
  41. ]
  42. train_dataloader = dict(dataset=dict(pipeline=train_pipeline))