resnetv1d_coco.md 4.6 KB

ResNetV1D (CVPR'2019)
@inproceedings{he2019bag,
  title={Bag of tricks for image classification with convolutional neural networks},
  author={He, Tong and Zhang, Zhi and Zhang, Hang and Zhang, Zhongyue and Xie, Junyuan and Li, Mu},
  booktitle={Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages={558--567},
  year={2019}
}

COCO (ECCV'2014)
@inproceedings{lin2014microsoft,
  title={Microsoft coco: Common objects in context},
  author={Lin, Tsung-Yi and Maire, Michael and Belongie, Serge and Hays, James and Perona, Pietro and Ramanan, Deva and Doll{\'a}r, Piotr and Zitnick, C Lawrence},
  booktitle={European conference on computer vision},
  pages={740--755},
  year={2014},
  organization={Springer}
}

Results on COCO val2017 with detector having human AP of 56.4 on COCO val2017 dataset

Arch Input Size AP AP50 AP75 AR AR50 ckpt log
pose_resnetv1d_50 256x192 0.722 0.897 0.796 0.777 0.936 ckpt log
pose_resnetv1d_50 384x288 0.730 0.899 0.800 0.782 0.935 ckpt log
pose_resnetv1d_101 256x192 0.732 0.901 0.808 0.785 0.940 ckpt log
pose_resnetv1d_101 384x288 0.748 0.906 0.817 0.798 0.941 ckpt log
pose_resnetv1d_152 256x192 0.737 0.904 0.814 0.790 0.940 ckpt log
pose_resnetv1d_152 384x288 0.751 0.907 0.821 0.801 0.942 ckpt log