@inproceedings{483289911b2c43debe800edb8c84283d,
title = "Design and Implementation of CNN Accelerator Based on FPGA",
abstract = "As one of the important research directions in the field of computer vision, CNN based object detection methods are constantly being updated, which puts higher requirements on the computational performance of hardware acceleration platforms. FPGA achieves a balance between acceleration performance, power consumption, and configurability, making it a good compromise for hardware accelerator platform options. Based on this, this paper implements a FPGA-based CNN accelerator with certain universality by designing universal operators. This paper mainly uses ping-pong buffer mechanism to optimize the loading of parameters and data and at the same time uses pipeline to optimize the calculation. Based on the concept of reverse positioning and sequence calculation, the operator is designed to achieve weight reuse and output feature map calculation. YOLOv4-Tiny is built on ZYNQ7020 for verification, which has an acceleration ratio of 1162 compared to using only the ARM processor and has an energy efficiency ratio of 2.847GOPS/W compared to GPU's 2.311GOPS/W.",
keywords = "CNN Accelerator, FPGA, Universal Operators, YOLOv4-Tiny",
author = "Xin Guan and Zhanqing Wang and Hao Fang",
note = "Publisher Copyright: {\textcopyright} 2024 Technical Committee on Control Theory, Chinese Association of Automation.; 43rd Chinese Control Conference, CCC 2024 ; Conference date: 28-07-2024 Through 31-07-2024",
year = "2024",
doi = "10.23919/CCC63176.2024.10661893",
language = "English",
series = "Chinese Control Conference, CCC",
publisher = "IEEE Computer Society",
pages = "8969--8974",
editor = "Jing Na and Jian Sun",
booktitle = "Proceedings of the 43rd Chinese Control Conference, CCC 2024",
address = "United States",
}