# metafile.yml
#
# Model-index metadata for the RetinaNet detectors under configs/pvt that use
# PyramidVisionTransformer / PyramidVisionTransformerV2 backbones.
# Each list item describes one trained checkpoint: its config file, training
# setup, COCO box AP, weights URL, source paper and backbone implementation.
#
# NOTE(review): block indentation was reconstructed from a flattened listing,
# following the nesting used by model-index metafiles (Metadata / Results /
# Paper / Code are mappings under each model) -- confirm against the
# repository copy. The listing's line gutter counted 243 lines while only 235
# were visible, so any trailing content after the last entry is not included.
Models:
  # --- PVT backbones (paper: arXiv 2102.12122) ---
  - Name: retinanet_pvt-t_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvt-t_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 8.5
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformer
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 36.6
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvt-t_fpn_1x_coco/retinanet_pvt-t_fpn_1x_coco_20210831_103110-17b566bd.pth
    Paper:
      URL: https://arxiv.org/abs/2102.12122
      Title: "Pyramid Vision Transformer: A Versatile Backbone for Dense Prediction without Convolutions"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L315
      Version: 2.17.0
  - Name: retinanet_pvt-s_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvt-s_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 14.5
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformer
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 40.4
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvt-s_fpn_1x_coco/retinanet_pvt-s_fpn_1x_coco_20210906_142921-b6c94a5b.pth
    Paper:
      URL: https://arxiv.org/abs/2102.12122
      Title: "Pyramid Vision Transformer: A Versatile Backbone for Dense Prediction without Convolutions"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L315
      Version: 2.17.0
  - Name: retinanet_pvt-m_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvt-m_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 20.9
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformer
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 41.7
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvt-m_fpn_1x_coco/retinanet_pvt-m_fpn_1x_coco_20210831_103243-55effa1b.pth
    Paper:
      URL: https://arxiv.org/abs/2102.12122
      Title: "Pyramid Vision Transformer: A Versatile Backbone for Dense Prediction without Convolutions"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L315
      Version: 2.17.0
  # --- PVTv2 backbones (paper: arXiv 2106.13797) ---
  - Name: retinanet_pvtv2-b0_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b0_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 7.4
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 37.1
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b0_fpn_1x_coco/retinanet_pvtv2-b0_fpn_1x_coco_20210831_103157-13e9aabe.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0
  - Name: retinanet_pvtv2-b1_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b1_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 9.5
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 41.2
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b1_fpn_1x_coco/retinanet_pvtv2-b1_fpn_1x_coco_20210831_103318-7e169a7d.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0
  - Name: retinanet_pvtv2-b2_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b2_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 16.2
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 44.6
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b2_fpn_1x_coco/retinanet_pvtv2-b2_fpn_1x_coco_20210901_174843-529f0b9a.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0
  - Name: retinanet_pvtv2-b3_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b3_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 23.0
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 46.0
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b3_fpn_1x_coco/retinanet_pvtv2-b3_fpn_1x_coco_20210903_151512-8357deff.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0
  - Name: retinanet_pvtv2-b4_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b4_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 17.0
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 46.3
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b4_fpn_1x_coco/retinanet_pvtv2-b4_fpn_1x_coco_20210901_170151-83795c86.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0
  - Name: retinanet_pvtv2-b5_fpn_1x_coco
    In Collection: RetinaNet
    Config: configs/pvt/retinanet_pvtv2-b5_fpn_1x_coco.py
    Metadata:
      Training Memory (GB): 18.7
      Epochs: 12
      Training Data: COCO
      Training Techniques:
        - SGD with Momentum
        - Weight Decay
      Training Resources: 8x NVIDIA V100 GPUs
      Architecture:
        - PyramidVisionTransformerV2
    Results:
      - Task: Object Detection
        Dataset: COCO
        Metrics:
          box AP: 46.1
    Weights: https://download.openmmlab.com/mmdetection/v2.0/pvt/retinanet_pvtv2-b5_fpn_1x_coco/retinanet_pvtv2-b5_fpn_1x_coco_20210902_201800-3420eb57.pth
    Paper:
      URL: https://arxiv.org/abs/2106.13797
      Title: "PVTv2: Improved Baselines with Pyramid Vision Transformer"
    README: configs/pvt/README.md
    Code:
      URL: https://github.com/open-mmlab/mmdetection/blob/v2.17.0/mmdet/models/backbones/pvt.py#L543
      Version: 2.17.0