Hand(2D)¶
Freihand2d Dataset¶
Topdown Heatmap + Resnet on Freihand2d¶
SimpleBaseline2D (ECCV'2018)
@inproceedings{xiao2018simple,
  author    = {Xiao, Bin and Wu, Haiping and Wei, Yichen},
  title     = {Simple baselines for human pose estimation and tracking},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  year      = {2018},
  pages     = {466--481},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
FreiHand (ICCV'2019)
@inproceedings{zimmermann2019freihand,
  author    = {Zimmermann, Christian and Ceylan, Duygu and Yang, Jimei and Russell, Bryan and Argus, Max and Brox, Thomas},
  title     = {{FreiHAND}: A Dataset for Markerless Capture of Hand Pose and Shape from Single {RGB} Images},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {813--822},
  year      = {2019},
}
Results on FreiHand val & test set
Set | Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|---|
val | pose_resnet_50 | 224x224 | 0.993 | 0.868 | 3.25 | ckpt | log |
test | pose_resnet_50 | 224x224 | 0.992 | 0.868 | 3.27 | ckpt | log |
Interhand2d Dataset¶
Topdown Heatmap + Resnet on Interhand2d¶
SimpleBaseline2D (ECCV'2018)
@inproceedings{xiao2018simple,
  author    = {Xiao, Bin and Wu, Haiping and Wei, Yichen},
  title     = {Simple baselines for human pose estimation and tracking},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  year      = {2018},
  pages     = {466--481},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
InterHand2.6M (ECCV'2020)
@inproceedings{Moon_2020_ECCV_InterHand2.6M,
  author    = {Moon, Gyeongsik and Yu, Shoou-I and Wen, He and Shiratori, Takaaki and Lee, Kyoung Mu},
  title     = {{InterHand2.6M}: A Dataset and Baseline for {3D} Interacting Hand Pose Estimation from a Single {RGB} Image},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2020},
}
Results on InterHand2.6M val & test set
Train Set | Set | Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|---|---|
Human_annot | val(M) | pose_resnet_50 | 256x256 | 0.973 | 0.828 | 5.15 | ckpt | log |
Human_annot | test(H) | pose_resnet_50 | 256x256 | 0.973 | 0.826 | 5.27 | ckpt | log |
Human_annot | test(M) | pose_resnet_50 | 256x256 | 0.975 | 0.841 | 4.90 | ckpt | log |
Human_annot | test(H+M) | pose_resnet_50 | 256x256 | 0.975 | 0.839 | 4.97 | ckpt | log |
Machine_annot | val(M) | pose_resnet_50 | 256x256 | 0.970 | 0.824 | 5.39 | ckpt | log |
Machine_annot | test(H) | pose_resnet_50 | 256x256 | 0.969 | 0.821 | 5.52 | ckpt | log |
Machine_annot | test(M) | pose_resnet_50 | 256x256 | 0.972 | 0.838 | 5.03 | ckpt | log |
Machine_annot | test(H+M) | pose_resnet_50 | 256x256 | 0.972 | 0.837 | 5.11 | ckpt | log |
All | val(M) | pose_resnet_50 | 256x256 | 0.977 | 0.840 | 4.66 | ckpt | log |
All | test(H) | pose_resnet_50 | 256x256 | 0.979 | 0.839 | 4.65 | ckpt | log |
All | test(M) | pose_resnet_50 | 256x256 | 0.979 | 0.838 | 4.42 | ckpt | log |
All | test(H+M) | pose_resnet_50 | 256x256 | 0.979 | 0.851 | 4.46 | ckpt | log |
Onehand10k Dataset¶
Deeppose + Resnet on Onehand10k¶
DeepPose (CVPR'2014)
@inproceedings{toshev2014deeppose,
  author    = {Toshev, Alexander and Szegedy, Christian},
  title     = {{DeepPose}: Human Pose Estimation via Deep Neural Networks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {1653--1660},
  year      = {2014},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
deeppose_resnet_50 | 256x256 | 0.990 | 0.486 | 34.28 | ckpt | log |
Topdown Heatmap + Mobilenetv2 on Onehand10k¶
MobilenetV2 (CVPR'2018)
@inproceedings{sandler2018mobilenetv2,
  author    = {Sandler, Mark and Howard, Andrew and Zhu, Menglong and Zhmoginov, Andrey and Chen, Liang-Chieh},
  title     = {{MobileNetV2}: Inverted Residuals and Linear Bottlenecks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {4510--4520},
  year      = {2018},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_mobilenet_v2 | 256x256 | 0.986 | 0.537 | 28.60 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Udp on Onehand10k¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
UDP (CVPR'2020)
@inproceedings{Huang_2020_CVPR,
  author    = {Huang, Junjie and Zhu, Zheng and Guo, Feng and Huang, Guan},
  title     = {The Devil Is in the Details: Delving Into Unbiased Data Processing for Human Pose Estimation},
  booktitle = {The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2020},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_udp | 256x256 | 0.990 | 0.572 | 23.87 | ckpt | log |
Topdown Heatmap + Resnet on Onehand10k¶
SimpleBaseline2D (ECCV'2018)
@inproceedings{xiao2018simple,
  author    = {Xiao, Bin and Wu, Haiping and Wei, Yichen},
  title     = {Simple baselines for human pose estimation and tracking},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  year      = {2018},
  pages     = {466--481},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_resnet_50 | 256x256 | 0.989 | 0.555 | 25.19 | ckpt | log |
Topdown Heatmap + Hrnetv2 on Onehand10k¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18 | 256x256 | 0.990 | 0.568 | 24.16 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Dark on Onehand10k¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
DarkPose (CVPR'2020)
@inproceedings{zhang2020distribution,
  author    = {Zhang, Feng and Zhu, Xiatian and Dai, Hanbin and Ye, Mao and Zhu, Ce},
  title     = {Distribution-aware coordinate representation for human pose estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  year      = {2020},
  pages     = {7093--7102},
}
OneHand10K (TCSVT'2019)
@article{wang2018mask,
  author    = {Wang, Yangang and Peng, Cong and Liu, Yebin},
  title     = {Mask-Pose Cascaded {CNN} for {2D} Hand Pose Estimation from Single Color Image},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
  volume    = {29},
  number    = {11},
  pages     = {3258--3268},
  year      = {2019},
  publisher = {IEEE},
}
Results on OneHand10K val set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_dark | 256x256 | 0.990 | 0.573 | 23.84 | ckpt | log |
Panoptic2d Dataset¶
Deeppose + Resnet on Panoptic2d¶
DeepPose (CVPR'2014)
@inproceedings{toshev2014deeppose,
  author    = {Toshev, Alexander and Szegedy, Christian},
  title     = {{DeepPose}: Human Pose Estimation via Deep Neural Networks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {1653--1660},
  year      = {2014},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
deeppose_resnet_50 | 256x256 | 0.999 | 0.686 | 9.36 | ckpt | log |
Topdown Heatmap + Hrnetv2 on Panoptic2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18 | 256x256 | 0.999 | 0.744 | 7.79 | ckpt | log |
Topdown Heatmap + Mobilenetv2 on Panoptic2d¶
MobilenetV2 (CVPR'2018)
@inproceedings{sandler2018mobilenetv2,
  author    = {Sandler, Mark and Howard, Andrew and Zhu, Menglong and Zhmoginov, Andrey and Chen, Liang-Chieh},
  title     = {{MobileNetV2}: Inverted Residuals and Linear Bottlenecks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {4510--4520},
  year      = {2018},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_mobilenet_v2 | 256x256 | 0.998 | 0.694 | 9.70 | ckpt | log |
Topdown Heatmap + Resnet on Panoptic2d¶
SimpleBaseline2D (ECCV'2018)
@inproceedings{xiao2018simple,
  author    = {Xiao, Bin and Wu, Haiping and Wei, Yichen},
  title     = {Simple baselines for human pose estimation and tracking},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  year      = {2018},
  pages     = {466--481},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_resnet_50 | 256x256 | 0.999 | 0.713 | 9.00 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Dark on Panoptic2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
DarkPose (CVPR'2020)
@inproceedings{zhang2020distribution,
  author    = {Zhang, Feng and Zhu, Xiatian and Dai, Hanbin and Ye, Mao and Zhu, Ce},
  title     = {Distribution-aware coordinate representation for human pose estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  year      = {2020},
  pages     = {7093--7102},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_dark | 256x256 | 0.999 | 0.745 | 7.77 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Udp on Panoptic2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
UDP (CVPR'2020)
@inproceedings{Huang_2020_CVPR,
  author    = {Huang, Junjie and Zhu, Zheng and Guo, Feng and Huang, Guan},
  title     = {The Devil Is in the Details: Delving Into Unbiased Data Processing for Human Pose Estimation},
  booktitle = {The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2020},
}
CMU Panoptic HandDB (CVPR'2017)
@inproceedings{simon2017hand,
  author    = {Simon, Tomas and Joo, Hanbyul and Matthews, Iain and Sheikh, Yaser},
  title     = {Hand keypoint detection in single images using multiview bootstrapping},
  booktitle = {Proceedings of the IEEE conference on Computer Vision and Pattern Recognition},
  year      = {2017},
  pages     = {1145--1153},
}
Results on CMU Panoptic (MPII+NZSL val set)
Arch | Input Size | PCKh@0.7 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_udp | 256x256 | 0.998 | 0.742 | 7.84 | ckpt | log |
Rhd2d Dataset¶
Deeppose + Resnet on Rhd2d¶
DeepPose (CVPR'2014)
@inproceedings{toshev2014deeppose,
  author    = {Toshev, Alexander and Szegedy, Christian},
  title     = {{DeepPose}: Human Pose Estimation via Deep Neural Networks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {1653--1660},
  year      = {2014},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
deeppose_resnet_50 | 256x256 | 0.988 | 0.865 | 3.29 | ckpt | log |
Topdown Heatmap + Mobilenetv2 on Rhd2d¶
MobilenetV2 (CVPR'2018)
@inproceedings{sandler2018mobilenetv2,
  author    = {Sandler, Mark and Howard, Andrew and Zhu, Menglong and Zhmoginov, Andrey and Chen, Liang-Chieh},
  title     = {{MobileNetV2}: Inverted Residuals and Linear Bottlenecks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {4510--4520},
  year      = {2018},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_mobilenet_v2 | 256x256 | 0.985 | 0.883 | 2.80 | ckpt | log |
Topdown Heatmap + Resnet on Rhd2d¶
SimpleBaseline2D (ECCV'2018)
@inproceedings{xiao2018simple,
  author    = {Xiao, Bin and Wu, Haiping and Wei, Yichen},
  title     = {Simple baselines for human pose estimation and tracking},
  booktitle = {Proceedings of the European conference on computer vision (ECCV)},
  year      = {2018},
  pages     = {466--481},
}
ResNet (CVPR'2016)
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  year      = {2016},
  pages     = {770--778},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_resnet_50 | 256x256 | 0.991 | 0.898 | 2.33 | ckpt | log |
Topdown Heatmap + Hrnetv2 on Rhd2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18 | 256x256 | 0.992 | 0.902 | 2.21 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Dark on Rhd2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
DarkPose (CVPR'2020)
@inproceedings{zhang2020distribution,
  author    = {Zhang, Feng and Zhu, Xiatian and Dai, Hanbin and Ye, Mao and Zhu, Ce},
  title     = {Distribution-aware coordinate representation for human pose estimation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  year      = {2020},
  pages     = {7093--7102},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_dark | 256x256 | 0.992 | 0.903 | 2.17 | ckpt | log |
Topdown Heatmap + Hrnetv2 + Udp on Rhd2d¶
HRNetv2 (TPAMI'2019)
@article{WangSCJDZLMTWLX19,
  author  = {Wang, Jingdong and Sun, Ke and Cheng, Tianheng and
             Jiang, Borui and Deng, Chaorui and Zhao, Yang and
             Liu, Dong and Mu, Yadong and Tan, Mingkui and
             Wang, Xinggang and Liu, Wenyu and Xiao, Bin},
  title   = {Deep High-Resolution Representation Learning for Visual Recognition},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2019},
}
UDP (CVPR'2020)
@inproceedings{Huang_2020_CVPR,
  author    = {Huang, Junjie and Zhu, Zheng and Guo, Feng and Huang, Guan},
  title     = {The Devil Is in the Details: Delving Into Unbiased Data Processing for Human Pose Estimation},
  booktitle = {The IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  month     = jun,
  year      = {2020},
}
RHD (ICCV'2017)
@techreport{zb2017hand,
  author        = {Zimmermann, Christian and Brox, Thomas},
  title         = {Learning to Estimate {3D} Hand Pose from Single {RGB} Images},
  institution   = {arXiv:1705.01389},
  year          = {2017},
  eprint        = {1705.01389},
  archiveprefix = {arXiv},
  note          = {https://arxiv.org/abs/1705.01389},
  url           = {https://lmb.informatik.uni-freiburg.de/projects/hand3d/},
}
Results on RHD test set
Arch | Input Size | PCK@0.2 | AUC | EPE | ckpt | log |
---|---|---|---|---|---|---|
pose_hrnetv2_w18_udp | 256x256 | 0.992 | 0.902 | 2.21 | ckpt | log |