lad_r101-paa-r50_fpn_2xb8_coco_1x.py 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127
  1. _base_ = [
  2. '../_base_/datasets/coco_detection.py',
  3. '../_base_/schedules/schedule_1x.py', '../_base_/default_runtime.py'
  4. ]
  5. teacher_ckpt = 'https://download.openmmlab.com/mmdetection/v2.0/paa/paa_r50_fpn_1x_coco/paa_r50_fpn_1x_coco_20200821-936edec3.pth' # noqa
  6. model = dict(
  7. type='LAD',
  8. data_preprocessor=dict(
  9. type='DetDataPreprocessor',
  10. mean=[123.675, 116.28, 103.53],
  11. std=[58.395, 57.12, 57.375],
  12. bgr_to_rgb=True,
  13. pad_size_divisor=32),
  14. # student
  15. backbone=dict(
  16. type='ResNet',
  17. depth=101,
  18. num_stages=4,
  19. out_indices=(0, 1, 2, 3),
  20. frozen_stages=1,
  21. norm_cfg=dict(type='BN', requires_grad=True),
  22. norm_eval=True,
  23. style='pytorch',
  24. init_cfg=dict(type='Pretrained',
  25. checkpoint='torchvision://resnet101')),
  26. neck=dict(
  27. type='FPN',
  28. in_channels=[256, 512, 1024, 2048],
  29. out_channels=256,
  30. start_level=1,
  31. add_extra_convs='on_output',
  32. num_outs=5),
  33. bbox_head=dict(
  34. type='LADHead',
  35. reg_decoded_bbox=True,
  36. score_voting=True,
  37. topk=9,
  38. num_classes=80,
  39. in_channels=256,
  40. stacked_convs=4,
  41. feat_channels=256,
  42. anchor_generator=dict(
  43. type='AnchorGenerator',
  44. ratios=[1.0],
  45. octave_base_scale=8,
  46. scales_per_octave=1,
  47. strides=[8, 16, 32, 64, 128]),
  48. bbox_coder=dict(
  49. type='DeltaXYWHBBoxCoder',
  50. target_means=[.0, .0, .0, .0],
  51. target_stds=[0.1, 0.1, 0.2, 0.2]),
  52. loss_cls=dict(
  53. type='FocalLoss',
  54. use_sigmoid=True,
  55. gamma=2.0,
  56. alpha=0.25,
  57. loss_weight=1.0),
  58. loss_bbox=dict(type='GIoULoss', loss_weight=1.3),
  59. loss_centerness=dict(
  60. type='CrossEntropyLoss', use_sigmoid=True, loss_weight=0.5)),
  61. # teacher
  62. teacher_ckpt=teacher_ckpt,
  63. teacher_backbone=dict(
  64. type='ResNet',
  65. depth=50,
  66. num_stages=4,
  67. out_indices=(0, 1, 2, 3),
  68. frozen_stages=1,
  69. norm_cfg=dict(type='BN', requires_grad=True),
  70. norm_eval=True,
  71. style='pytorch'),
  72. teacher_neck=dict(
  73. type='FPN',
  74. in_channels=[256, 512, 1024, 2048],
  75. out_channels=256,
  76. start_level=1,
  77. add_extra_convs='on_output',
  78. num_outs=5),
  79. teacher_bbox_head=dict(
  80. type='LADHead',
  81. reg_decoded_bbox=True,
  82. score_voting=True,
  83. topk=9,
  84. num_classes=80,
  85. in_channels=256,
  86. stacked_convs=4,
  87. feat_channels=256,
  88. anchor_generator=dict(
  89. type='AnchorGenerator',
  90. ratios=[1.0],
  91. octave_base_scale=8,
  92. scales_per_octave=1,
  93. strides=[8, 16, 32, 64, 128]),
  94. bbox_coder=dict(
  95. type='DeltaXYWHBBoxCoder',
  96. target_means=[.0, .0, .0, .0],
  97. target_stds=[0.1, 0.1, 0.2, 0.2]),
  98. loss_cls=dict(
  99. type='FocalLoss',
  100. use_sigmoid=True,
  101. gamma=2.0,
  102. alpha=0.25,
  103. loss_weight=1.0),
  104. loss_bbox=dict(type='GIoULoss', loss_weight=1.3),
  105. loss_centerness=dict(
  106. type='CrossEntropyLoss', use_sigmoid=True, loss_weight=0.5)),
  107. # training and testing settings
  108. train_cfg=dict(
  109. assigner=dict(
  110. type='MaxIoUAssigner',
  111. pos_iou_thr=0.1,
  112. neg_iou_thr=0.1,
  113. min_pos_iou=0,
  114. ignore_iof_thr=-1),
  115. allowed_border=-1,
  116. pos_weight=-1,
  117. debug=False),
  118. test_cfg=dict(
  119. nms_pre=1000,
  120. min_bbox_size=0,
  121. score_thr=0.05,
  122. score_voting=True,
  123. nms=dict(type='nms', iou_threshold=0.6),
  124. max_per_img=100))
  125. train_dataloader = dict(batch_size=8, num_workers=4)
  126. optim_wrapper = dict(type='AmpOptimWrapper', optimizer=dict(lr=0.01))