mask-rcnn_r50_fpn_albu-1x_coco.py 1.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566
  1. _base_ = '../mask_rcnn/mask-rcnn_r50_fpn_1x_coco.py'
  2. albu_train_transforms = [
  3. dict(
  4. type='ShiftScaleRotate',
  5. shift_limit=0.0625,
  6. scale_limit=0.0,
  7. rotate_limit=0,
  8. interpolation=1,
  9. p=0.5),
  10. dict(
  11. type='RandomBrightnessContrast',
  12. brightness_limit=[0.1, 0.3],
  13. contrast_limit=[0.1, 0.3],
  14. p=0.2),
  15. dict(
  16. type='OneOf',
  17. transforms=[
  18. dict(
  19. type='RGBShift',
  20. r_shift_limit=10,
  21. g_shift_limit=10,
  22. b_shift_limit=10,
  23. p=1.0),
  24. dict(
  25. type='HueSaturationValue',
  26. hue_shift_limit=20,
  27. sat_shift_limit=30,
  28. val_shift_limit=20,
  29. p=1.0)
  30. ],
  31. p=0.1),
  32. dict(type='JpegCompression', quality_lower=85, quality_upper=95, p=0.2),
  33. dict(type='ChannelShuffle', p=0.1),
  34. dict(
  35. type='OneOf',
  36. transforms=[
  37. dict(type='Blur', blur_limit=3, p=1.0),
  38. dict(type='MedianBlur', blur_limit=3, p=1.0)
  39. ],
  40. p=0.1),
  41. ]
  42. train_pipeline = [
  43. dict(type='LoadImageFromFile', backend_args={{_base_.backend_args}}),
  44. dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
  45. dict(type='Resize', scale=(1333, 800), keep_ratio=True),
  46. dict(
  47. type='Albu',
  48. transforms=albu_train_transforms,
  49. bbox_params=dict(
  50. type='BboxParams',
  51. format='pascal_voc',
  52. label_fields=['gt_bboxes_labels', 'gt_ignore_flags'],
  53. min_visibility=0.0,
  54. filter_lost_elements=True),
  55. keymap={
  56. 'img': 'image',
  57. 'gt_masks': 'masks',
  58. 'gt_bboxes': 'bboxes'
  59. },
  60. skip_img_without_anno=True),
  61. dict(type='RandomFlip', prob=0.5),
  62. dict(type='PackDetInputs')
  63. ]
  64. train_dataloader = dict(dataset=dict(pipeline=train_pipeline))