% GCVNet conference paper (Han et al.), PRCV 2020 proceedings, pp. 180--192.
% Acronyms in the title are brace-protected so sentence-casing styles keep them.
% NOTE(review): the address field holds a country ("Germany"); BibTeX expects
% the publisher's city -- confirm the city and replace.
% NOTE(review): the series volume number is not recorded -- TODO add a volume
% field once confirmed against the publisher's record.
@inproceedings{3a5d0e5375e849de86790b8dacf3d065,
title = "{GCVNet}: Geometry Constrained Voting Network to Estimate {3D} Pose for Fine-Grained Object Categories",
abstract = "As a fundamental AI problem, monocular 3D pose estimation has received much attention. This paper addresses the challenge of estimating full perspective model parameters, including object pose and camera intrinsics, from a single 2D image of fine-grained object categories. To tackle this highly ill-posed problem, we propose a Geometry Constrained Voting Network (GCVNet). It is a unified end-to-end network consisting of four synergic task-specific subnetworks: 1) Fine-grained classification subnetwork, offering fine-grained 3D shape priors. 2) Voting subnetwork, generating 2D measurements. 3) Segmentation subnetwork, providing a foreground mask for voting. 4) PnP subnetwork, estimating the perspective parameters via explicit geometric reasoning, as well as constraining the classification subnetwork to provide proper 3D priors and the voting subnetwork to generate a group of geometric consistent 2D measurements, rather than independent voting for each 2D measurement in the literature. Experiments on challenging datasets demonstrate the superior performance of GCVNet.",
keywords = "Differentiable PnP, Geometric reasoning, Pose estimation",
author = "Han, Yaohang and Di, Huijun and Zheng, Hanfeng and Qi, Jianyong and Gong, Jianwei",
note = "Publisher Copyright: {\textcopyright} 2020, Springer Nature Switzerland AG.; 3rd Chinese Conference on Pattern Recognition and Computer Vision, PRCV 2020 ; Conference date: 16-10-2020 Through 18-10-2020",
year = "2020",
doi = "10.1007/978-3-030-60633-6_15",
language = "English",
isbn = "9783030606329",
series = "Lecture Notes in Computer Science",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "180--192",
editor = "Peng, Yuxin and Zha, Hongbin and Liu, Qingshan and Lu, Huchuan and Sun, Zhenan and Liu, Chenglin and Chen, Xilin and Yang, Jian",
booktitle = "Pattern Recognition and Computer Vision - 3rd Chinese Conference, {PRCV} 2020, Proceedings",
address = "Germany",
}