@inproceedings{69dd9cda475c4ec389a22c7f69604075,
title = "Cap-CasMVSNet:Capsul-based Cascade Cost Volume for Multi-View Stereo Network",
abstract = "Currently deep learning has been widely used in multi-view stereo, but there is still room for optimization. In this paper, we propose a capsule network-based multi-view stereo network, namely Cap-CasMVSNet. We first introduce a transformer-based filter to highlight the foreground part of the feature. Then aiming at the shortcomings of the fixed receptive field of the traditional convolution kernel, we added a deformable convolution module to the network to enable the convolution to adapt to geometric deformation. We use a capsule neuron to handle global semantic connections between high-level features. Finally, we achieve competitive results on the DTU dataset, showing strong robustness.",
keywords = "capsule network, multi-view stereo, transformer",
author = "Hongmin Zhou and Yuan Li",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 38th Youth Academic Annual Conference of Chinese Association of Automation, YAC 2023 ; Conference date: 27-08-2023 Through 29-08-2023",
year = "2023",
doi = "10.1109/YAC59482.2023.10401477",
language = "English",
series = "Proceedings - 2023 38th Youth Academic Annual Conference of Chinese Association of Automation, YAC 2023",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "59--63",
booktitle = "Proceedings - 2023 38th Youth Academic Annual Conference of Chinese Association of Automation, YAC 2023",
address = "United States",
}