Conference paper "YOLO-FS" in the ICCAID 2024 proceedings (SPIE, 2025).
The citation key is kept unchanged so existing citations keep resolving.
NOTE(review): address holds a country, not the publisher's city - confirm and refine if the city is known.

@inproceedings{df640a9772164bf197524214086a9c1d,
  author    = {Li, Chengxiang and Zhang, Weimin and Li, Fangxing and Fan, Shicheng and Guo, Meijun and He, Xiaohai},
  title     = {{YOLO-FS}: a unified framework for object detection and semantic segmentation},
  booktitle = {International Conference on Computer Graphics, Artificial Intelligence, and Data Processing, {ICCAID} 2024},
  editor    = {Xu, Xin and Zain, Azlan bin Mohd},
  series    = {Proceedings of SPIE - The International Society for Optical Engineering},
  publisher = {SPIE},
  address   = {United States},
  year      = {2025},
  doi       = {10.1117/12.3061480},
  language  = {English},
  keywords  = {autonomous vehicles, convolutional neural networks, object detection, quadruped robots, semantic segmentation},
  abstract  = {The integration of object detection and semantic segmentation leverages the advantages of object localization and pixel-level semantic understanding to provide enhanced environment awareness for robot navigation and autonomous driving systems. In this paper, we propose an innovative model that combines YOLOv5 for object detection with a Fast-SCNNbased semantic segmentation module to form a unified framework capable of performing both object detection and semantic segmentation tasks. The model is trained and tested on public and homemade dataset, and validated using camera data collected from self-driving vehicles and quadruped robots. The experimental results show that the model has a mAP50 of 48.3\% an improvement of 1.6\% over the original algorithm, and the segmentation mean intersection rate (MIoU) on the public dataset is 70.6\% an improvement of 2.5\% over the original algorithm. On the homemade dataset, the performance of the model improved significantly with vehicle detection accuracy of more than 90\% and average intersection joint rate of 89.3\%. These findings indicate that the model can effectively enhance perception in complex environments and provide key support for safer and more efficient autonomous navigation.},
  note      = {Publisher Copyright: {\textcopyright} 2025 SPIE.; 2024 International Conference on Computer Graphics, Artificial Intelligence, and Data Processing, ICCAID 2024 ; Conference date: 13-12-2024 Through 15-12-2024},
}