lad_r50-paa-r101_fpn_2xb8_coco_1x.py 3.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126
  1. _base_ = [
  2. '../_base_/datasets/coco_detection.py',
  3. '../_base_/schedules/schedule_1x.py', '../_base_/default_runtime.py'
  4. ]
  5. teacher_ckpt = 'http://download.openmmlab.com/mmdetection/v2.0/paa/paa_r101_fpn_1x_coco/paa_r101_fpn_1x_coco_20200821-0a1825a4.pth' # noqa
  6. model = dict(
  7. type='LAD',
  8. data_preprocessor=dict(
  9. type='DetDataPreprocessor',
  10. mean=[123.675, 116.28, 103.53],
  11. std=[58.395, 57.12, 57.375],
  12. bgr_to_rgb=True,
  13. pad_size_divisor=32),
  14. # student
  15. backbone=dict(
  16. type='ResNet',
  17. depth=50,
  18. num_stages=4,
  19. out_indices=(0, 1, 2, 3),
  20. frozen_stages=1,
  21. norm_cfg=dict(type='BN', requires_grad=True),
  22. norm_eval=True,
  23. style='pytorch',
  24. init_cfg=dict(type='Pretrained', checkpoint='torchvision://resnet50')),
  25. neck=dict(
  26. type='FPN',
  27. in_channels=[256, 512, 1024, 2048],
  28. out_channels=256,
  29. start_level=1,
  30. add_extra_convs='on_output',
  31. num_outs=5),
  32. bbox_head=dict(
  33. type='LADHead',
  34. reg_decoded_bbox=True,
  35. score_voting=True,
  36. topk=9,
  37. num_classes=80,
  38. in_channels=256,
  39. stacked_convs=4,
  40. feat_channels=256,
  41. anchor_generator=dict(
  42. type='AnchorGenerator',
  43. ratios=[1.0],
  44. octave_base_scale=8,
  45. scales_per_octave=1,
  46. strides=[8, 16, 32, 64, 128]),
  47. bbox_coder=dict(
  48. type='DeltaXYWHBBoxCoder',
  49. target_means=[.0, .0, .0, .0],
  50. target_stds=[0.1, 0.1, 0.2, 0.2]),
  51. loss_cls=dict(
  52. type='FocalLoss',
  53. use_sigmoid=True,
  54. gamma=2.0,
  55. alpha=0.25,
  56. loss_weight=1.0),
  57. loss_bbox=dict(type='GIoULoss', loss_weight=1.3),
  58. loss_centerness=dict(
  59. type='CrossEntropyLoss', use_sigmoid=True, loss_weight=0.5)),
  60. # teacher
  61. teacher_ckpt=teacher_ckpt,
  62. teacher_backbone=dict(
  63. type='ResNet',
  64. depth=101,
  65. num_stages=4,
  66. out_indices=(0, 1, 2, 3),
  67. frozen_stages=1,
  68. norm_cfg=dict(type='BN', requires_grad=True),
  69. norm_eval=True,
  70. style='pytorch'),
  71. teacher_neck=dict(
  72. type='FPN',
  73. in_channels=[256, 512, 1024, 2048],
  74. out_channels=256,
  75. start_level=1,
  76. add_extra_convs='on_output',
  77. num_outs=5),
  78. teacher_bbox_head=dict(
  79. type='LADHead',
  80. reg_decoded_bbox=True,
  81. score_voting=True,
  82. topk=9,
  83. num_classes=80,
  84. in_channels=256,
  85. stacked_convs=4,
  86. feat_channels=256,
  87. anchor_generator=dict(
  88. type='AnchorGenerator',
  89. ratios=[1.0],
  90. octave_base_scale=8,
  91. scales_per_octave=1,
  92. strides=[8, 16, 32, 64, 128]),
  93. bbox_coder=dict(
  94. type='DeltaXYWHBBoxCoder',
  95. target_means=[.0, .0, .0, .0],
  96. target_stds=[0.1, 0.1, 0.2, 0.2]),
  97. loss_cls=dict(
  98. type='FocalLoss',
  99. use_sigmoid=True,
  100. gamma=2.0,
  101. alpha=0.25,
  102. loss_weight=1.0),
  103. loss_bbox=dict(type='GIoULoss', loss_weight=1.3),
  104. loss_centerness=dict(
  105. type='CrossEntropyLoss', use_sigmoid=True, loss_weight=0.5)),
  106. # training and testing settings
  107. train_cfg=dict(
  108. assigner=dict(
  109. type='MaxIoUAssigner',
  110. pos_iou_thr=0.1,
  111. neg_iou_thr=0.1,
  112. min_pos_iou=0,
  113. ignore_iof_thr=-1),
  114. allowed_border=-1,
  115. pos_weight=-1,
  116. debug=False),
  117. test_cfg=dict(
  118. nms_pre=1000,
  119. min_bbox_size=0,
  120. score_thr=0.05,
  121. score_voting=True,
  122. nms=dict(type='nms', iou_threshold=0.6),
  123. max_per_img=100))
  124. train_dataloader = dict(batch_size=8, num_workers=4)
  125. optim_wrapper = dict(type='AmpOptimWrapper', optimizer=dict(lr=0.01))