@inproceedings{fc904a04e3a3419683710468e453c08a,
title = "A Platform Independent Model Design and Adaptation for Edge Intelligence",
abstract = "Along with the rapid developments in deep learning and edge computing technologies, deploying models on mobile devices is a trend for modern applications. However, the resource-constrained and heterogeneous edge devices fail to cope with complicated model inference. To tackle this challenge, this study explores the platform independent model design based on Open Neural Network Exchange. Then we quantize the existing heavy deep learning models into lightweight ones by applying low-precision arithmetic and partitioning the computational graph into sub-graphs for parallel execution and hardware-based acceleration on heterogeneous systems. This study evaluates the efficiency and effectiveness among different quantization settings and analyses the impacts for model acceleration. The experiments show that the quantized models with uint8 type computation perform faster inference while still preserve high performance. This result suggests a novel solution for the research on edge intelligence.",
keywords = "Edge Computing, Edge Intelligence, IoT, Model Inference, ONNX, Quantization",
author = "Chaolong Zhang and Jiliu Zhou and Jia He and Zhijie Xu and Jin Jin and Chao Kong and Yuanping Xu and Benjun Guo and Qiuyan Gai",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 29th International Conference on Automation and Computing, ICAC 2024 ; Conference date: 28-08-2024 Through 30-08-2024",
year = "2024",
doi = "10.1109/ICAC61394.2024.10718820",
language = "English",
series = "ICAC 2024 - 29th International Conference on Automation and Computing",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "ICAC 2024 - 29th International Conference on Automation and Computing",
}