% Conference paper "TreeNet" (Lu, Zhai, Wu, Shen), published in the CCGrid 2021
% proceedings; the DOI field is the canonical identifier for this record.
%
% Conventions used in this entry:
%   - "TreeNet" is brace-protected in the title so sentence-casing styles do
%     not rewrite it as "Treenet".
%   - Editors with multi-part given names use the "Last, First" form with no
%     escaped braces (escaped braces would be printed literally).
%   - The proceedings title lives only in booktitle; repeating it in series
%     makes standard styles print it twice.
%   - NOTE(review): address holds a country, not a publisher city; the city is
%     not recoverable from this record -- confirm and refine if needed.
%   - NOTE(review): the note field carries export boilerplate (copyright line,
%     conference dates) that styles print verbatim -- confirm it is wanted.
@inproceedings{f94e6eb6a2574dbca475be60ed831559,
  author    = "Dong Lu and Yanlong Zhai and Jianqing Wu and Jun Shen",
  title     = "{TreeNet}: A hierarchical deep learning model to facilitate edge intelligence for resource-constrained devices",
  editor    = "Laurent Lefevre and Stacy Patterson and Lee, Young Choon and Haiying Shen and Shashikant Ilager and Mohammad Goudarzi and Toosi, Adel N. and Rajkumar Buyya",
  booktitle = "Proceedings - 21st IEEE/ACM International Symposium on Cluster, Cloud and Internet Computing, CCGrid 2021",
  pages     = "525--534",
  publisher = "Institute of Electrical and Electronics Engineers Inc.",
  address   = "United States",
  year      = "2021",
  month     = may,
  doi       = "10.1109/CCGrid51090.2021.00062",
  language  = "English",
  keywords  = "deep learning, edge computing, edge intelligence, model acceleration, model compression, resource-constrained",
  note      = "Publisher Copyright: {\textcopyright} 2021 IEEE.; 21st IEEE/ACM International Symposium on Cluster, Cloud and Internet Computing, CCGrid 2021 ; Conference date: 10-05-2021 Through 13-05-2021",
  abstract  = "Deep learning has achieved remarkable successes in various areas such as computer vision and natural language processing. Many sophisticated models have been proposed to improve performance by designing a significant number of layers of neurons. As an emerging research area, edge intelligence tries to bring intelligence to the network edge by integrating edge computing and AI technologies and it has gained wide attention for its lower latency and better privacy preservation features. Nevertheless, training and inferencing deep neural networks require intensive computation power and time, making it quite challenging to run the models on the resource-constrained edge devices. In this paper, we propose a deep learning model, namely TreeNet, based on task decomposition. After obtaining a task, we would not fit the entire task but decompose the task into disjoint sub-tasks to reduce the complexity of the required deep learning model (it could be divided multiple times if necessary). We first fit the original dataset mapping to different sub-tasks and then fit the mapping of each sub-task to the category of the original dataset that it contains. During the running of the model, we dynamically call the low-level classifier based on the inference result of the high-level classifier. When the inference result of the high-level classifier is unreliable, we send the input sample to the cloud server for processing. We use several popular datasets to study the TreeNet architecture and show that it can process most of the input data while achieving high inference accuracy and significantly decreasing the total amount of calculation.",
}