@inproceedings{3216a1c1022c4515a2c52cd9116ecd1c,
title = "Multispectral Feature-Fusion Object Detection Based on Multi-Scale Auxiliary Branch",
abstract = "Object detection in real-world environments is inherently challenging due to various factors, such as poor illumination conditions, which can significantly hinder detection accuracy. To overcome the above challenges, we propose a multispectral feature-fusion object detection framework by designing a dual-modal backbone based on YOLOv8. Within the backbone, we propose a Feature Reconstruction Fusion module based on the Swin Transformer, which reconstructs dual-modal features by considering the intensity of spatial information and learns complementary inter-modal information. Moreover, we design multi-scale auxiliary branches during the training stage to complement the single-modal gradient information at different levels, strengthening the model's ability to recognize multi-scale targets. Our method is tested on several public datasets, including the FLIR-aligned, LLVIP, and M3FD datasets. The results show that our network not only achieves remarkable accuracy in detecting small-sized targets but also outperforms other state-of-the-art networks in mean average precision.",
keywords = "auxiliary branch, multispectral object detection, Swin Transformer, YOLOv8",
author = "Kangdi Yin and Weixing Li and Ziyi Zheng and Hao Zhang and Feng Pan and Xiaoxue Feng",
note = "Publisher Copyright: {\textcopyright} 2025 Technical Committee on Control Theory, Chinese Association of Automation.; 44th Chinese Control Conference, CCC 2025 ; Conference date: 28-07-2025 Through 30-07-2025",
year = "2025",
doi = "10.23919/CCC64809.2025.11178534",
language = "English",
series = "Chinese Control Conference, CCC",
publisher = "IEEE Computer Society",
pages = "7727--7732",
editor = "Jian Sun and Hongpeng Yin",
booktitle = "Proceedings of the 44th Chinese Control Conference, CCC 2025",
address = "United States",
}